From b4c5b8d265f896f9f7312f75838abafdeff2943c Mon Sep 17 00:00:00 2001 From: yyhhyyyyyy Date: Wed, 17 Dec 2025 10:17:32 +0800 Subject: [PATCH] fix(renderer): apply custom font to shell tab bar and tooltip overlay --- mise.toml | 3 + resources/model-db/providers.json | 32130 ++++++++++++------- src/renderer/shell/App.vue | 3 + src/renderer/shell/tooltip-overlay/main.ts | 35 + src/renderer/src/lib/fontStack.ts | 13 + src/renderer/src/stores/uiSettingsStore.ts | 17 +- 6 files changed, 20575 insertions(+), 11626 deletions(-) create mode 100644 mise.toml create mode 100644 src/renderer/src/lib/fontStack.ts diff --git a/mise.toml b/mise.toml new file mode 100644 index 000000000..40ca167b6 --- /dev/null +++ b/mise.toml @@ -0,0 +1,3 @@ +[tools] +node = "24" +pnpm = "latest" diff --git a/resources/model-db/providers.json b/resources/model-db/providers.json index 0c035f03b..a6c8f6029 100644 --- a/resources/model-db/providers.json +++ b/resources/model-db/providers.json @@ -526,8 +526,8 @@ }, { "id": "glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", @@ -591,6 +591,40 @@ "cache_read": 0, "cache_write": 0 } + }, + { + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 0, + "output": 0 + } } ] }, @@ -655,9 +689,9 @@ "last_updated": "2025-09-22" }, { - "id": "gpt-oss:120b-cloud", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "qwen3-coder:480b-cloud", + "name": "Qwen3 Coder 480B", + "display_name": "Qwen3 Coder 480B", "modalities": { "input": [ "text" @@ -673,18 +707,17 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05" + "release_date": "2025-07-22", + "last_updated": "2025-07-22" }, { - "id": "qwen3-coder-480b-cloud", - "name": "Qwen3 Coder 480B", - "display_name": "Qwen3 Coder 480B", + "id": "gpt-oss:120b-cloud", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -700,12 +733,13 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22" + "release_date": "2025-08-05", + "last_updated": "2025-08-05" }, { "id": "deepseek-v3.1:671b-cloud", @@ -4182,6 +4216,40 @@ "output": 0 } }, + { + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } + }, { "id": "moonshotai/kimi-k2-instruct", "name": "Kimi K2 Instruct", @@ -4693,6 +4761,102 @@ "output": 0 } }, + { + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral-2-123B-Instruct-2512", + "display_name": "Devstral-2-123B-Instruct-2512", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B Instruct 2512", + "display_name": "Mistral Large 3 675B Instruct 2512", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "mistralai/ministral-14b-instruct-2512", + "name": "Ministral 3 14B Instruct 2512", + "display_name": "Ministral 3 14B Instruct 2512", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-08", + "cost": { + "input": 0, + "output": 0 + } + }, { "id": "deepseek-ai/deepseek-v3.1-terminus", "name": "DeepSeek V3.1 Terminus", @@ -6263,9 +6427,9 @@ } }, { - "id": "o3", - "name": "o3 (Preview)", - "display_name": "o3 (Preview)", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-max", + "display_name": "GPT-5.1-Codex-max", "modalities": { "input": [ "text", @@ -6277,7 +6441,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": false, "tool_call": true, @@ -6287,51 +6451,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", - "cost": { - "input": 0, - "output": 0 - } - }, - { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09-30", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { "input": 0, "output": 0 } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "o3", + "name": "o3 (Preview)", + "display_name": "o3 (Preview)", "modalities": { "input": [ "text", @@ -6343,42 +6474,9 @@ }, "limit": { "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0, - "output": 0 - } - }, - { - "id": "claude-3.7-sonnet-thought", - "name": "Claude Sonnet 3.7 Thinking", - "display_name": "Claude Sonnet 3.7 Thinking", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -6386,18 +6484,117 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { "input": 0, "output": 0 } }, { - "id": "claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "claude-3.7-sonnet-thought", + "name": "Claude Sonnet 3.7 Thinking", + "display_name": "Claude Sonnet 3.7 Thinking", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -6427,6 +6624,39 @@ "output": 0 } }, + { + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 64000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 0, + "output": 0 + } + }, { "id": "claude-sonnet-4.5", "name": "Claude Sonnet 4.5", @@ -6499,6 +6729,38 @@ "output": 2 } }, + { + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 + } + }, { "id": "open-mixtral-8x22b", "name": "Mixtral 8x22B", @@ -6593,6 +6855,38 @@ "output": 6 } }, + { + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "cost": { + "input": 0.1, + "output": 0.3 + } + }, { "id": "ministral-3b-latest", "name": "Ministral 3B", @@ -6688,6 +6982,69 @@ "output": 2 } }, + { + "id": "labs-devstral-small-2512", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0.1, + "output": 0.3 + } + }, + { + "id": "devstral-medium-latest", + "name": "Devstral 2", + "display_name": "Devstral 2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.4, + "output": 2 + } + }, { "id": "devstral-small-2505", "name": "Devstral Small 2505", @@ -6751,6 +7108,36 @@ "output": 2 } }, + { + "id": "mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 3072 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", + "cost": { + "input": 0.1, + "output": 0 + } + }, { "id": "mistral-small-latest", "name": "Mistral Small", @@ -6976,29 +7363,30 @@ "display_name": "Mistral Large", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, "knowledge": "2024-11", "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "last_updated": "2025-12-02", "cost": { - "input": 2, - "output": 6 + "input": 0.5, + "output": 1.5 } }, { @@ -7033,6 +7421,37 @@ "output": 2 } }, + { + "id": "mistral-large-2411", + "name": "Mistral Large 2.1", + "display_name": "Mistral Large 2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", + "cost": { + "input": 2, + "output": 6 + } + }, { "id": "magistral-medium-latest", "name": "Magistral Medium", @@ -7694,29 +8113,30 @@ "display_name": "Mistral Large", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, "knowledge": "2024-11", "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "last_updated": "2025-12-02", "cost": { - "input": 2, - "output": 6 + "input": 0.5, + "output": 1.5 } }, { @@ -9546,7 +9966,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9581,7 +10002,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9616,7 +10038,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9650,7 +10073,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9685,7 +10109,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9720,7 +10145,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9754,7 +10180,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9789,7 +10216,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9824,7 +10252,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9858,7 +10287,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -9892,7 +10322,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -13258,44 +13689,45 @@ "doc": "https://docs.venice.ai", "models": [ { - "id": "dolphin-2.9.2-qwen2-72b", - "name": "Dolphin 72B", - "display_name": "Dolphin 72B", + "id": "grok-41-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 262144, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2021-09", - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.7, - "output": 2.8 + "input": 0.5, + "output": 1.25 } }, { - "id": "mistral-31-24b", - "name": "Venice Medium", - "display_name": "Venice Medium", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B A22B Instruct 2507", + "display_name": "Qwen 3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -13312,53 +13744,87 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", "cost": { - "input": 0.5, - "output": 2 + "input": 0.15, + "output": 0.75 } }, { - "id": "venice-uncensored", - "name": "Venice Uncensored 1.1", - "display_name": "Venice Uncensored 1.1", + "id": "claude-opus-45", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 202752, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", + "cost": { + "input": 6, + "output": 30 + } + }, + { + "id": "mistral-31-24b", + "name": "Venice Medium", + "display_name": "Venice Medium", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, "knowledge": "2023-10", "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "last_updated": "2025-12-09", "cost": { "input": 0.5, "output": 2 } }, { - "id": "qwen-2.5-vl", - "name": "Qwen 2.5 VL 72B", - "display_name": "Qwen 2.5 VL 72B", + "id": "venice-uncensored", + "name": "Venice Uncensored 1.1", + "display_name": "Venice Uncensored 1.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -13376,17 +13842,17 @@ "attachment": false, "open_weights": true, "knowledge": "2023-10", - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "release_date": "2025-07-15", + "last_updated": "2025-12-09", "cost": { - "input": 0.7, - "output": 2.8 + "input": 0.2, + "output": 0.9 } }, { - "id": "qwen3-235b", - "name": "Venice Large", - "display_name": "Venice Large", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text" @@ -13396,7 +13862,7 @@ ] }, "limit": { - "context": 131072, + "context": 202752, "output": 8192 }, "temperature": true, @@ -13405,52 +13871,54 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-27", - "last_updated": "2025-07-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.5, - "output": 6 + "input": 2.5, + "output": 15 } }, { - "id": "qwen-2.5-qwq-32b", - "name": "Venice Reasoning", - "display_name": "Venice Reasoning", + "id": "openai-gpt-52", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.5, - "output": 2 + "input": 2.19, + "output": 17.5, + "cache_read": 0.175 } }, { - "id": "deepseek-coder-v2-lite", - "name": "DeepSeek Coder V2 Lite", - "display_name": "DeepSeek Coder V2 Lite", + "id": "qwen3-235b", + "name": "Venice Large 1.1", + "display_name": "Venice Large 1.1", "modalities": { "input": [ "text" @@ -13464,18 +13932,19 @@ "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2021-09", - "release_date": "2025-06-22", - "last_updated": "2025-06-22", + "knowledge": "2024-10", + "release_date": "2025-07-27", + "last_updated": "2025-12-09", "cost": { - "input": 0.5, - "output": 2 + "input": 0.45, + "output": 3.5 } }, { @@ -13504,10 +13973,10 @@ "open_weights": true, "knowledge": "2024-07", "release_date": "2025-07-27", - "last_updated": "2025-07-27", + "last_updated": "2025-12-09", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.05, + "output": 0.15 } }, { @@ -13542,9 +14011,9 @@ } }, { - "id": "qwen-2.5-coder-32b", - "name": "Qwen 2.5 Coder 32B", - "display_name": "Qwen 2.5 Coder 32B", + "id": "openai-gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text" @@ -13554,28 +14023,60 @@ ] }, "limit": { - "context": 32768, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2025-06-14", - "last_updated": "2025-06-14", + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", "cost": { - "input": 0.5, - "output": 2 + "input": 0.07, + "output": 0.3 + } + }, + { + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.75, + "output": 3.2 } }, { - "id": "deepseek-r1-671b", - "name": "DeepSeek R1 671B", - "display_name": "DeepSeek R1 671B", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen 3 235B A22B Thinking 2507", + "display_name": "Qwen 3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -13589,19 +14090,19 @@ "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", "cost": { - "input": 3.5, - "output": 14 + "input": 0.45, + "output": 3.5 } }, { @@ -13636,9 +14137,41 @@ } }, { - "id": "llama-3.1-405b", - "name": "Llama 3.1 405B", - "display_name": "Llama 3.1 405B", + "id": "google-gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 202752, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", + "cost": { + "input": 0.12, + "output": 0.2 + } + }, + { + "id": "hermes-3-llama-3.1-405b", + "name": "Hermes 3 Llama 3.1 405b", + "display_name": "Hermes 3 Llama 3.1 405b", "modalities": { "input": [ "text" @@ -13648,7 +14181,7 @@ ] }, "limit": { - "context": 65536, + "context": 131072, "output": 8192 }, "temperature": true, @@ -13658,12 +14191,43 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "knowledge": "2024-04", + "release_date": "2024-04-15", + "last_updated": "2024-04-15", "cost": { - "input": 1.5, - "output": 6 + "input": 1.1, + "output": 3 + } + }, + { + "id": "qwen3-next-80b", + "name": "Qwen 3 Next 80b", + "display_name": "Qwen 3 Next 80b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", + "cost": { + "input": 0.35, + "output": 1.9 } }, { @@ -13696,6 +14260,68 @@ "input": 0.85, "output": 2.75 } + }, + { + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen 3 Coder 480b", + "display_name": "Qwen 3 Coder 480b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", + "cost": { + "input": 0.75, + "output": 3 + } + }, + { + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2025-10-05", + "last_updated": "2025-10-05", + "cost": { + "input": 0.4, + "output": 1 + } } ] }, @@ -13886,93 +14512,105 @@ "attachment": false, "open_weights": true, "release_date": "2025-11-08", - "last_updated": "2025-11-08", + "last_updated": "2025-12-11", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.04, + "output": 0.15 } } ] }, - "agentrouter": { - "id": "agentrouter", - "name": "AgentRouter", - "display_name": "AgentRouter", - "api": "https://agentrouter.org/v1", - "doc": "https://docs.agentrouter.org", + "kimi-for-coding": { + "id": "kimi-for-coding", + "name": "Kimi For Coding", + "display_name": "Kimi For Coding", + "api": "https://api.kimi.com/coding/v1", + "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", "models": [ { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { - "input": 3, - "output": 15 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 } - }, + } + ] + }, + "cortecs": { + "id": "cortecs", + "name": "Cortecs", + "display_name": "Cortecs", + "api": "https://api.cortecs.ai/v1", + "doc": "https://api.cortecs.ai/v1/models", + "models": [ { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "nova-pro-v1", + "name": "Nova Pro 1.0", + "display_name": "Nova Pro 1.0", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 300000, + "output": 5000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "knowledge": "2024-04", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.3, - "output": 0.045 + "input": 1.016, + "output": 4.061 } }, { - "id": "claude-sonnet-4-20250514-thinking", - "name": "Claude Sonnet 4 Thinking", - "display_name": "Claude Sonnet 4 Thinking", + "id": "claude-4-5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -13980,7 +14618,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 200000 }, "temperature": true, "tool_call": true, @@ -13990,18 +14628,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 10 + "input": 3.259, + "output": 16.296 } }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -14011,8 +14649,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -14021,86 +14659,81 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.003, - "output": 0 + "input": 0.551, + "output": 1.654 } }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-07-11", + "last_updated": "2025-09-05", "cost": { - "input": 3, - "output": 15 + "input": 0.551, + "output": 2.646 } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2024-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 8 + "input": 2.354, + "output": 9.417 } }, { - "id": "claude-3-7-sonnet-20250219-thinking", - "name": "Claude Sonnet 3.7 Thinking", - "display_name": "Claude Sonnet 3.7 Thinking", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", @@ -14111,29 +14744,28 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-17", "cost": { - "input": 3, - "output": 15 + "input": 1.654, + "output": 11.024 } }, { - "id": "deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "gpt-oss-120b", + "name": "GPT Oss 120b", + "display_name": "GPT Oss 120b", "modalities": { "input": [ "text" @@ -14144,159 +14776,162 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 0.045 + "input": 0, + "output": 0 } }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5 (20250929)", - "display_name": "Claude Sonnet 4.5 (20250929)", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 6, - "output": 30 + "input": 0.441, + "output": 1.984 } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.002, - "output": 0 + "input": 3.307, + "output": 16.536 } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "llama-3.1-405b-instruct", + "name": "Llama 3.1 405B Instruct", + "display_name": "Llama 3.1 405B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2, - "output": 2 + "input": 0, + "output": 0 } }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 3, - "output": 15 + "input": 0.099, + "output": 0.33 } - }, + } + ] + }, + "github-models": { + "id": "github-models", + "name": "GitHub Models", + "display_name": "GitHub Models", + "api": "https://models.github.ai/inference", + "doc": "https://docs.github.com/en/github-models", + "models": [ { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "core42/jais-30b-chat", + "name": "JAIS 30b Chat", + "display_name": "JAIS 30b Chat", "modalities": { "input": [ "text" @@ -14306,8 +14941,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -14317,30 +14952,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2023-03", + "release_date": "2023-08-30", + "last_updated": "2023-08-30", "cost": { - "input": 0.003, + "input": 0, "output": 0 } }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -14348,64 +14982,63 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 21, - "output": 105 + "input": 0, + "output": 0 } }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude 3.5 Haiku (20241022)", - "display_name": "Claude 3.5 Haiku (20241022)", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 1, - "output": 5 + "input": 0, + "output": 0 } }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "cohere/cohere-command-r-08-2024", + "name": "Cohere Command R 08-2024", + "display_name": "Cohere Command R 08-2024", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -14413,20 +15046,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 3, - "output": 15 + "input": 0, + "output": 0 } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "cohere/cohere-command-a", + "name": "Cohere Command A", + "display_name": "Cohere Command A", "modalities": { "input": [ "text" @@ -14436,8 +15069,8 @@ ] }, "limit": { - "context": 1280000, - "output": 1280000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -14447,29 +15080,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-11-27", - "last_updated": "2025-11-27", + "knowledge": "2024-03", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { "input": 0, "output": 0 } }, { - "id": "claude-opus-4-20250514-thinking", - "name": "Claude Opus 4 Thinking", - "display_name": "Claude Opus 4 Thinking", + "id": "cohere/cohere-command-r-plus-08-2024", + "name": "Cohere Command R+ 08-2024", + "display_name": "Cohere Command R+ 08-2024", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -14477,20 +15110,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 2, - "output": 10 + "input": 0, + "output": 0 } }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "cohere/cohere-command-r", + "name": "Cohere Command R", + "display_name": "Cohere Command R", "modalities": { "input": [ "text" @@ -14501,39 +15134,39 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "knowledge": "2024-03", + "release_date": "2024-03-11", + "last_updated": "2024-08-01", "cost": { - "input": 0.3, - "output": 0.045 + "input": 0, + "output": 0 } }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5 (20251001)", - "display_name": "Claude Haiku 4.5 (20251001)", + "id": "cohere/cohere-command-r-plus", + "name": "Cohere Command R+", + "display_name": "Cohere Command R+", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -14541,73 +15174,63 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "knowledge": "2024-03", + "release_date": "2024-04-04", + "last_updated": "2024-08-01", "cost": { - "input": 2, - "output": 4 + "input": 0, + "output": 0 } - } - ] - }, - "cortecs": { - "id": "cortecs", - "name": "Cortecs", - "display_name": "Cortecs", - "api": "https://api.cortecs.ai/v1", - "doc": "https://api.cortecs.ai/v1/models", - "models": [ + }, { - "id": "nova-pro-v1", - "name": "Nova Pro 1.0", - "display_name": "Nova Pro 1.0", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 5000 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1.016, - "output": 4.061 + "input": 0, + "output": 0 } }, { - "id": "claude-4-5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 Sonnet", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -14615,20 +15238,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 3.259, - "output": 16.296 + "input": 0, + "output": 0 } }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -14639,122 +15262,125 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", + "knowledge": "2024-06", "release_date": "2025-03-24", "last_updated": "2025-03-24", "cost": { - "input": 0.551, - "output": 1.654 + "input": 0, + "output": 0 } }, { - "id": "kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "mistral-ai/mistral-medium-2505", + "name": "Mistral Medium 3 (25.05)", + "display_name": "Mistral Medium 3 (25.05)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-07-11", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.551, - "output": 2.646 + "input": 0, + "output": 0 } }, { - "id": "gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "mistral-ai/ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2.354, - "output": 9.417 + "input": 0, + "output": 0 } }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "mistral-ai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-17", + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.654, - "output": 11.024 + "input": 0, + "output": 0 } }, { - "id": "gpt-oss-120b", - "name": "GPT Oss 120b", - "display_name": "GPT Oss 120b", + "id": "mistral-ai/mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ "text" @@ -14765,27 +15391,28 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-01", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { "input": 0, "output": 0 } }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "mistral-ai/codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ "text" @@ -14795,28 +15422,29 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.441, - "output": 1.984 + "input": 0, + "output": 0 } }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "mistral-ai/mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ "text", @@ -14827,28 +15455,29 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 3.307, - "output": 16.536 + "input": 0, + "output": 0 } }, { - "id": "llama-3.1-405b-instruct", - "name": "Llama 3.1 405B Instruct", - "display_name": "Llama 3.1 405B Instruct", + "id": "microsoft/phi-3-medium-128k-instruct", + "name": "Phi-3-medium instruct (128k)", + "display_name": "Phi-3-medium instruct (128k)", "modalities": { "input": [ "text" @@ -14859,27 +15488,28 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0, "output": 0 } }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "microsoft/phi-3-mini-4k-instruct", + "name": "Phi-3-mini instruct (4k)", + "display_name": "Phi-3-mini instruct (4k)", "modalities": { "input": [ "text" @@ -14889,37 +15519,29 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.099, - "output": 0.33 + "input": 0, + "output": 0 } - } - ] - }, - "github-models": { - "id": "github-models", - "name": "GitHub Models", - "display_name": "GitHub Models", - "api": "https://models.github.ai/inference", - "doc": "https://docs.github.com/en/github-models", - "models": [ + }, { - "id": "core42/jais-30b-chat", - "name": "JAIS 30b Chat", - "display_name": "JAIS 30b Chat", + "id": "microsoft/phi-3-small-128k-instruct", + "name": "Phi-3-small instruct (128k)", + "display_name": "Phi-3-small instruct (128k)", "modalities": { "input": [ "text" @@ -14929,8 +15551,8 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -14940,21 +15562,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-03", - "release_date": "2023-08-30", - "last_updated": "2023-08-30", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0, "output": 0 } }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "microsoft/phi-3.5-vision-instruct", + "name": "Phi-3.5-vision instruct (128k)", + "display_name": "Phi-3.5-vision instruct (128k)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -14962,7 +15585,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -14971,19 +15594,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { "input": 0, "output": 0 } }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "microsoft/phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -14993,8 +15616,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -15003,19 +15626,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { "input": 0, "output": 0 } }, { - "id": "cohere/cohere-command-r-08-2024", - "name": "Cohere Command R 08-2024", - "display_name": "Cohere Command R 08-2024", + "id": "microsoft/phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -15035,19 +15658,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { "input": 0, "output": 0 } }, { - "id": "cohere/cohere-command-a", - "name": "Cohere Command A", - "display_name": "Cohere Command A", + "id": "microsoft/phi-3-small-8k-instruct", + "name": "Phi-3-small instruct (8k)", + "display_name": "Phi-3-small instruct (8k)", "modalities": { "input": [ "text" @@ -15057,8 +15680,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -15067,19 +15690,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0, "output": 0 } }, { - "id": "cohere/cohere-command-r-plus-08-2024", - "name": "Cohere Command R+ 08-2024", - "display_name": "Cohere Command R+ 08-2024", + "id": "microsoft/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini instruct (128k)", + "display_name": "Phi-3.5-mini instruct (128k)", "modalities": { "input": [ "text" @@ -15099,22 +15722,24 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { "input": 0, "output": 0 } }, { - "id": "cohere/cohere-command-r", - "name": "Cohere Command R", - "display_name": "Cohere Command R", - "modalities": { + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi-4-multimodal-instruct", + "display_name": "Phi-4-multimodal-instruct", + "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -15131,19 +15756,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-11", - "last_updated": "2024-08-01", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { "input": 0, "output": 0 } }, { - "id": "cohere/cohere-command-r-plus", - "name": "Cohere Command R+", - "display_name": "Cohere Command R+", + "id": "microsoft/phi-3-mini-128k-instruct", + "name": "Phi-3-mini instruct (128k)", + "display_name": "Phi-3-mini instruct (128k)", "modalities": { "input": [ "text" @@ -15163,19 +15788,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-04-04", - "last_updated": "2024-08-01", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0, "output": 0 } }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "microsoft/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE instruct (128k)", + "display_name": "Phi-3.5-MoE instruct (128k)", "modalities": { "input": [ "text" @@ -15185,8 +15810,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -15196,18 +15821,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { "input": 0, "output": 0 } }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -15217,8 +15842,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -15228,18 +15853,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { "input": 0, "output": 0 } }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "microsoft/phi-3-medium-4k-instruct", + "name": "Phi-3-medium instruct (4k)", + "display_name": "Phi-3-medium instruct (4k)", "modalities": { "input": [ "text" @@ -15249,8 +15874,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": true, @@ -15260,22 +15885,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0, "output": 0 } }, { - "id": "mistral-ai/mistral-medium-2505", - "name": "Mistral Medium 3 (25.05)", - "display_name": "Mistral Medium 3 (25.05)", + "id": "microsoft/phi-4-reasoning", + "name": "Phi-4-Reasoning", + "display_name": "Phi-4-Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -15283,7 +15907,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -15292,19 +15916,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { "input": 0, "output": 0 } }, { - "id": "mistral-ai/ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "microsoft/mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -15314,7 +15938,7 @@ ] }, "limit": { - "context": 128000, + "context": 65536, "output": 8192 }, "temperature": true, @@ -15324,22 +15948,23 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { "input": 0, "output": 0 } }, { - "id": "mistral-ai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -15347,31 +15972,31 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0, "output": 0 } }, { - "id": "mistral-ai/mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -15379,28 +16004,27 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0, "output": 0 } }, { - "id": "mistral-ai/codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ "text" @@ -15410,65 +16034,66 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { "input": 0, "output": 0 } }, { - "id": "mistral-ai/mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3-medium-128k-instruct", - "name": "Phi-3-medium instruct (128k)", - "display_name": "Phi-3-medium instruct (128k)", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -15476,92 +16101,92 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3-mini-4k-instruct", - "name": "Phi-3-mini instruct (4k)", - "display_name": "Phi-3-mini instruct (4k)", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3-small-128k-instruct", - "name": "Phi-3-small instruct (128k)", - "display_name": "Phi-3-small instruct (128k)", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3.5-vision-instruct", - "name": "Phi-3.5-vision instruct (128k)", - "display_name": "Phi-3.5-vision instruct (128k)", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ "text", @@ -15572,29 +16197,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "openai/o1-mini", + "name": "OpenAI o1-mini", + "display_name": "OpenAI o1-mini", "modalities": { "input": [ "text" @@ -15604,96 +16229,100 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3-small-8k-instruct", - "name": "Phi-3-small instruct (8k)", - "display_name": "Phi-3-small instruct (8k)", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3.5-mini-instruct", - "name": "Phi-3.5-mini instruct (128k)", - "display_name": "Phi-3.5-mini instruct (128k)", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -15701,7 +16330,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -15711,23 +16340,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi-4-multimodal-instruct", - "display_name": "Phi-4-multimodal-instruct", + "id": "meta/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" @@ -15735,7 +16362,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -15745,21 +16372,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3-mini-128k-instruct", - "name": "Phi-3-mini instruct (128k)", - "display_name": "Phi-3-mini instruct (128k)", + "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -15767,7 +16395,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -15777,18 +16405,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE instruct (128k)", - "display_name": "Phi-3.5-MoE instruct (128k)", + "id": "meta/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -15798,8 +16426,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -15809,18 +16437,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "meta/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -15831,7 +16459,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -15841,18 +16469,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-3-medium-4k-instruct", - "name": "Phi-3-medium instruct (4k)", - "display_name": "Phi-3-medium instruct (4k)", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -15862,8 +16490,8 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -15873,21 +16501,23 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/phi-4-reasoning", - "name": "Phi-4-Reasoning", - "display_name": "Phi-4-Reasoning", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -15895,7 +16525,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -15905,18 +16535,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { "input": 0, "output": 0 } }, { - "id": "microsoft/mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "meta/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -15926,8 +16556,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -15936,19 +16566,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { "input": 0, "output": 0 } }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -15960,31 +16590,31 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { "input": 0, "output": 0 } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "meta/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -15992,27 +16622,28 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { "input": 0, "output": 0 } }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "ai21-labs/ai21-jamba-1.5-large", + "name": "AI21 Jamba 1.5 Large", + "display_name": "AI21 Jamba 1.5 Large", "modalities": { "input": [ "text" @@ -16022,29 +16653,29 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { "input": 0, "output": 0 } }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "ai21-labs/ai21-jamba-1.5-mini", + "name": "AI21 Jamba 1.5 Mini", + "display_name": "AI21 Jamba 1.5 Mini", "modalities": { "input": [ "text" @@ -16054,62 +16685,77 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { "input": 0, "output": 0 } - }, + } + ] + }, + "togetherai": { + "id": "togetherai", + "name": "Together AI", + "display_name": "Together AI", + "doc": "https://docs.together.ai/docs/serverless-models", + "models": [ { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6 } - }, + } + ] + }, + "azure": { + "id": "azure", + "name": "Azure", + "display_name": "Azure", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", @@ -16120,8 +16766,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -16130,51 +16776,48 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", + "knowledge": "2024-05", "release_date": "2025-04-14", "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 } }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "OpenAI o4-mini", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8191, + "output": 1536 }, - "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0, + "input": 0.02, "output": 0 } }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ "text", @@ -16185,29 +16828,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2000000, + "output": 30000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 } }, { - "id": "openai/o1-mini", - "name": "OpenAI o1-mini", - "display_name": "OpenAI o1-mini", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -16217,29 +16860,29 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 163840, + "output": 163840 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0, - "output": 0 + "input": 1.35, + "output": 5.4 } }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ "text", @@ -16250,34 +16893,33 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2000000, + "output": 30000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" @@ -16285,72 +16927,71 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2023-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0, - "output": 0 + "input": 0.17, + "output": 0.68 } }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0, - "output": 0 + "input": 60, + "output": 120 } }, { - "id": "meta/meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -16358,20 +16999,22 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ "text", @@ -16388,55 +17031,53 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0, - "output": 0 + "input": 0.37, + "output": 0.37 } }, { - "id": "meta/meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0, + "input": 0.12, "output": 0 } }, { - "id": "meta/meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -16447,7 +17088,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4000 }, "temperature": true, "tool_call": true, @@ -16457,18 +17098,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6 } }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" @@ -16478,8 +17119,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -16488,53 +17129,51 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "reasoning": 15, + "cache_read": 0.75 } }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0, + "input": 0.1, "output": 0 } }, { - "id": "meta/meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ "text" @@ -16544,62 +17183,59 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0, - "output": 0 + "input": 0.075, + "output": 0.3 } }, { - "id": "meta/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0, - "output": 0 + "input": 60, + "output": 120 } }, { - "id": "meta/meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -16615,8 +17251,7 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, @@ -16624,14 +17259,14 @@ "release_date": "2024-07-23", "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0 + "input": 5.33, + "output": 16 } }, { - "id": "ai21-labs/ai21-jamba-1.5-large", - "name": "AI21 Jamba 1.5 Large", - "display_name": "AI21 Jamba 1.5 Large", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -16641,29 +17276,29 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0, - "output": 0 + "input": 1.35, + "output": 5.4 } }, { - "id": "ai21-labs/ai21-jamba-1.5-mini", - "name": "AI21 Jamba 1.5 Mini", - "display_name": "AI21 Jamba 1.5 Mini", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -16674,7 +17309,7 @@ }, "limit": { "context": 256000, - "output": 4096 + "output": 10000 }, "temperature": true, "tool_call": true, @@ -16684,98 +17319,56 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 } - } - ] - }, - "togetherai": { - "id": "togetherai", - "name": "Together AI", - "display_name": "Together AI", - "doc": "https://docs.together.ai/docs/serverless-models", - "models": [ + }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.15, - "output": 0.6 - } - } - ] - }, - "azure": { - "id": "azure", - "name": "Azure", - "display_name": "Azure", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ - { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ "text" @@ -16785,103 +17378,109 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 4096, + "output": 1024 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.02, - "output": 0 + "input": 0.13, + "output": 0.52 } }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.4, + "output": 2 } }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -16891,19 +17490,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 5, + "output": 25, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -16927,14 +17527,14 @@ "release_date": "2024-04-23", "last_updated": "2024-04-23", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.15, + "output": 0.6 } }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ "text" @@ -16944,40 +17544,40 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 60, - "output": 120 + "input": 2.5, + "output": 10 } }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -16985,22 +17585,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2.5, + "output": 10 } }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", @@ -17021,18 +17619,18 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.37, - "output": 0.37 + "input": 0.25, + "output": 1 } }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", @@ -17043,30 +17641,33 @@ ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 1047576, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.12, - "output": 0 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 } }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -17074,28 +17675,29 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -17105,8 +17707,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -17115,21 +17717,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 0.56, + "output": 1.68 } }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -17139,27 +17739,28 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.1, - "output": 0 + "input": 0.125, + "output": 0.5 } }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -17175,7 +17776,8 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, @@ -17188,40 +17790,45 @@ } }, { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 60, - "output": 120 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ "text" @@ -17231,28 +17838,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 5.33, - "output": 16 + "input": 0.5, + "output": 1.5 } }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -17262,29 +17869,29 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 1.35, - "output": 5.4 + "input": 3, + "output": 15, + "cache_read": 0.75 } }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -17294,67 +17901,88 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.13, + "output": 0 } }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 2048 }, - "temperature": false, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "cost": { + "input": 2.68, + "output": 3.54 + } + }, + { + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.14, + "output": 4.56 } }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -17364,8 +17992,8 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": false, @@ -17378,49 +18006,45 @@ "release_date": "2024-04-23", "last_updated": "2024-04-23", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.15, + "output": 0.6 } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 2.68, + "output": 3.54 } }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -17432,7 +18056,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -17441,53 +18065,49 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.4, - "output": 2 + "input": 10, + "output": 30 } }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3, + "output": 4 } }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ "text" @@ -17508,17 +18128,17 @@ "attachment": false, "open_weights": true, "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.13, + "output": 0.52 } }, { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -17528,29 +18148,30 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 128000, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 2.5, - "output": 10 + "input": 16.5, + "output": 66, + "cache_read": 8.25 } }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -17561,60 +18182,64 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.71, + "output": 0.71 } }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { "input": 0.25, - "output": 1 + "output": 2, + "cache_read": 0.025 } }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ "text", @@ -17625,158 +18250,164 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.14, + "output": 0 } }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 100000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 } }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.56, - "output": 1.68 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 272000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 } }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.075, - "output": 0.3 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ "text", @@ -17787,31 +18418,28 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2.04, + "output": 2.04 } }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ "text" @@ -17821,8 +18449,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -17830,51 +18458,52 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.13, + "output": 0.52 } }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 2.5, + "output": 10, + "cache_read": 1.25 } }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -17884,37 +18513,8 @@ ] }, "limit": { - "context": 8191, - "output": 3072 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.13, - "output": 0 - } - }, - { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 2048 + "context": 4096, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -17922,19 +18522,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 2.68, - "output": 3.54 + "input": 1.5, + "output": 2 } }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -17944,8 +18544,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -17954,59 +18554,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", - "cost": { - "input": 1.14, - "output": 4.56 - } - }, - { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 2048 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.04, + "output": 0.04 } }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, "temperature": true, @@ -18014,20 +18584,21 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2.68, - "output": 3.54 + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", @@ -18038,59 +18609,64 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 10, - "output": 30 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 } }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "attachment": true, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 3, - "output": 4 + "input": 0.08, + "output": 0.32, + "input_audio": 4 } }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -18100,8 +18676,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": false, @@ -18110,29 +18686,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.3, + "output": 0.61 } }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -18143,18 +18720,18 @@ "attachment": false, "open_weights": false, "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 + "input": 15, + "output": 60, + "cache_read": 7.5 } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -18164,28 +18741,31 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.3, + "output": 0.5, + "reasoning": 0.5, + "cache_read": 0.075 } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", @@ -18199,8 +18779,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, @@ -18208,25 +18788,24 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-09-30", "release_date": "2025-11-14", "last_updated": "2025-11-14", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -18234,36 +18813,39 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.14, - "output": 0 + "input": 0.16, + "output": 0.64 } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 272000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -18271,36 +18853,32 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.25, + "output": 2, + "cache_read": 0.03 } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 128000, + "output": 65536 }, "temperature": false, "tool_call": true, @@ -18308,21 +18886,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 } }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -18333,96 +18911,87 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.2, + "output": 0.78 } }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 512, + "output": 1024 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.1, + "output": 0 } }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": false, + "open_weights": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 2.04, - "output": 2.04 + "input": 0.1, + "output": 0 } }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -18433,27 +19002,27 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.3, + "output": 0.61 } }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", @@ -18464,29 +19033,30 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.5, + "input": 1.25, "output": 10, - "cache_read": 1.25 + "cache_read": 0.125 } }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -18507,17 +19077,17 @@ "attachment": false, "open_weights": false, "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { "input": 1.5, "output": 2 } }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -18528,7 +19098,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -18537,19 +19107,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.15, + "output": 0.15 } }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", - "modalities": { + "id": "o3", + "name": "o3", + "display_name": "o3", + "modalities": { "input": [ "text", "image" @@ -18559,19 +19129,20 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { "input": 2, "output": 8, @@ -18579,13 +19150,12 @@ } }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -18603,53 +19173,50 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 1.5, + "output": 6, + "cache_read": 0.375 } }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + "input": 0.17, + "output": 0.68 } }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ "text" @@ -18659,28 +19226,29 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 32000, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.125, + "output": 0.5 } }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ "text", @@ -18691,30 +19259,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 10, + "output": 30 } }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ "text" @@ -18724,47 +19290,75 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0.125, + "output": 0.5 } }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { "context": 128000, "output": 16384 }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } + }, + { + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 272000, + "output": 128000 + }, "temperature": false, "tool_call": true, "reasoning": { @@ -18774,18 +19368,18 @@ "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125 + "cache_read": 0.13 } }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -18796,27 +19390,28 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.16, - "output": 0.64 + "input": 1.35, + "output": 5.4 } }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", @@ -18827,8 +19422,8 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 400000, + "output": 272000 }, "temperature": false, "tool_call": true, @@ -18838,19 +19433,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 15, + "output": 120 } }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ "text" @@ -18861,29 +19455,27 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 2, + "output": 6 } }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -18894,28 +19486,30 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.2, - "output": 0.78 + "input": 1.75, + "output": 14, + "cache_read": 0.125 } }, { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ "text" @@ -18925,56 +19519,60 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 256000, + "output": 256000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.1, - "output": 0 + "input": 0.3, + "output": 0.9 } }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { "input": 0.1, - "output": 0 + "output": 0.3 } }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ "text" @@ -18984,28 +19582,37 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 0.3, - "output": 0.61 + "input": 1, + "output": 2 } - }, + } + ] + }, + "siliconflow": { + "id": "siliconflow", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.com/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "deepseek-ai-deepseek-r1-distill-qwen-7b", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "modalities": { "input": [ "text" @@ -19015,28 +19622,28 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 33000, + "output": 16000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 2 + "input": 0.05, + "output": 0.05 } }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "z-ai-glm-4.5-air", + "name": "z-ai/GLM-4.5-Air", + "display_name": "z-ai/GLM-4.5-Air", "modalities": { "input": [ "text" @@ -19046,8 +19653,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -19055,86 +19662,79 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.14, + "output": 0.86 } }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "qwen-qwen2.5-72b-instruct-128k", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.59, + "output": 0.59 } }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "deepseek-ai-deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 4000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "release_date": "2024-12-13", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 0.15, + "output": 0.15 } }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "moonshotai-kimi-dev-72b", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", "modalities": { "input": [ "text" @@ -19144,28 +19744,27 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2025-06-19", + "last_updated": "2025-11-25", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.29, + "output": 1.15 } }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "qwen-qwen2.5-coder-32b-instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -19175,494 +19774,13 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 33000, + "output": 4000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.125, - "output": 0.5 - } - }, - { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", - "cost": { - "input": 10, - "output": 30 - } - }, - { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.125, - "output": 0.5 - } - }, - { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - } - }, - { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 272000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - } - }, - { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 1.35, - "output": 5.4 - } - }, - { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 2, - "output": 6 - } - }, - { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.3, - "output": 0.9 - } - }, - { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", - "cost": { - "input": 0.1, - "output": 0.3 - } - }, - { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 16384 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", - "cost": { - "input": 1, - "output": 2 - } - } - ] - }, - "siliconflow": { - "id": "siliconflow", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.com/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ - { - "id": "deepseek-ai-deepseek-r1-distill-qwen-7b", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 33000, - "output": 16000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", - "cost": { - "input": 0.05, - "output": 0.05 - } - }, - { - "id": "z-ai-glm-4.5-air", - "name": "z-ai/GLM-4.5-Air", - "display_name": "z-ai/GLM-4.5-Air", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 131000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.86 - } - }, - { - "id": "qwen-qwen2.5-72b-instruct-128k", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.59, - "output": 0.59 - } - }, - { - "id": "deepseek-ai-deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 4000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", - "cost": { - "input": 0.15, - "output": 0.15 - } - }, - { - "id": "moonshotai-kimi-dev-72b", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 131000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-06-19", - "last_updated": "2025-11-25", - "cost": { - "input": 0.29, - "output": 1.15 - } - }, - { - "id": "qwen-qwen2.5-coder-32b-instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 33000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "supported": false }, "attachment": false, "open_weights": false, @@ -21895,28 +22013,29 @@ } ] }, - "opencode": { - "id": "opencode", - "name": "OpenCode Zen", - "display_name": "OpenCode Zen", - "api": "https://opencode.ai/zen/v1", - "doc": "https://opencode.ai/docs/zen", + "helicone": { + "id": "helicone", + "name": "Helicone", + "display_name": "Helicone", + "api": "https://ai-gateway.helicone.ai/v1", + "doc": "https://helicone.ai/models", "models": [ { - "id": "qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "gpt-4.1-nano", + "name": "OpenAI GPT-4.1 Nano", + "display_name": "OpenAI GPT-4.1 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -21924,57 +22043,60 @@ "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.45, - "output": 1.8 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998 } }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "grok-4-fast-non-reasoning", + "name": "xAI Grok 4 Fast Non-Reasoning", + "display_name": "xAI Grok 4 Fast Non-Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-09", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 } }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" @@ -21982,7 +22104,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -21990,55 +22112,51 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 + "input": 0.22, + "output": 0.95 } }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "knowledge": "2024-12", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ "text", @@ -22050,7 +22168,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -22058,22 +22176,22 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "grok-4-fast-reasoning", + "name": "xAI: Grok 4 Fast Reasoning", + "display_name": "xAI: Grok 4 Fast Reasoning", "modalities": { "input": [ "text", @@ -22084,8 +22202,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -22093,64 +22211,52 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2025-09", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 } }, { - "id": "gemini-3-pro", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "llama-3.1-8b-instant", + "name": "Meta Llama 3.1 8B Instant", + "display_name": "Meta Llama 3.1 8B Instant", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 131072, + "output": 32678 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.049999999999999996, + "output": 0.08 } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "claude-opus-4-1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ "text", @@ -22161,8 +22267,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -22170,28 +22276,22 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "alpha-gd4", - "name": "Alpha GD4", - "display_name": "Alpha GD4", + "id": "grok-4", + "name": "xAI Grok 4", + "display_name": "xAI Grok 4", "modalities": { "input": [ "text" @@ -22201,98 +22301,94 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-09", + "last_updated": "2024-07-09", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.15 + "input": 3, + "output": 15, + "cache_read": 0.75 } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 262000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 + "input": 0.14, + "output": 1.4 } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "llama-4-maverick", + "name": "Meta Llama 4 Maverick 17B 128E", + "display_name": "Meta Llama 4 Maverick 17B 128E", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.15, + "output": 0.6 } }, { - "id": "alpha-minimax-m2", - "name": "MiniMax M2 (alpha)", - "display_name": "MiniMax M2 (alpha)", + "id": "llama-prompt-guard-2-86m", + "name": "Meta Llama Prompt Guard 2 86M", + "display_name": "Meta Llama Prompt Guard 2 86M", "modalities": { "input": [ "text" @@ -22302,29 +22398,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.01, + "output": 0.01 } }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "grok-4-1-fast-reasoning", + "name": "xAI Grok 4.1 Fast Reasoning", + "display_name": "xAI Grok 4.1 Fast Reasoning", "modalities": { "input": [ "text", @@ -22335,67 +22430,66 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 2000000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 } }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "grok-code-fast-1", + "name": "xAI Grok Code Fast 1", + "display_name": "xAI Grok Code Fast 1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 10000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-08", + "release_date": "2024-08-25", + "last_updated": "2024-08-25", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.19999999999999998, + "output": 1.5, + "cache_read": 0.02 } }, { - "id": "big-pickle", - "name": "Big Pickle", - "display_name": "Big Pickle", + "id": "claude-4.5-haiku", + "name": "Anthropic: Claude 4.5 Haiku", + "display_name": "Anthropic: Claude 4.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -22403,327 +22497,305 @@ }, "limit": { "context": 200000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-10-17", - "last_updated": "2025-10-17", + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 } }, { - "id": "claude-3-5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "llama-3.1-8b-instruct-turbo", + "name": "Meta Llama 3.1 8B Instruct Turbo", + "display_name": "Meta Llama 3.1 8B Instruct Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.02, + "output": 0.03 } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "gpt-5.1-codex", + "name": "OpenAI: GPT-5.1 Codex", + "display_name": "OpenAI: GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.1 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 } }, { - "id": "grok-code", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "gpt-4.1-mini-2025-04-14", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-20", - "last_updated": "2025-08-20", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 } }, { - "id": "alpha-doubao-seed-code", - "name": "Doubao Seed Code (alpha)", - "display_name": "Doubao Seed Code (alpha)", + "id": "llama-guard-4", + "name": "Meta Llama Guard 4 12B", + "display_name": "Meta Llama Guard 4 12B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-11-11", - "last_updated": "2025-11-11", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.21, + "output": 0.21 } }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "llama-3.1-8b-instruct", + "name": "Meta Llama 3.1 8B Instruct", + "display_name": "Meta Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 0.02, + "output": 0.049999999999999996 } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gemini-3-pro-preview", + "name": "Google Gemini 3 Pro Preview", + "display_name": "Google Gemini 3 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-11", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 2, + "output": 12, + "cache_read": 0.19999999999999998 } - } - ] - }, - "fastrouter": { - "id": "fastrouter", - "name": "FastRouter", - "display_name": "FastRouter", - "api": "https://go.fastrouter.ai/api/v1", - "doc": "https://fastrouter.ai/models", - "models": [ + }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "gemini-2.5-flash", + "name": "Google Gemini 2.5 Flash", + "display_name": "Google Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.55, - "output": 2.2 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.3 } }, { - "id": "x-ai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "gpt-4.1-mini", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 15 + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -22731,56 +22803,52 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.0375 + "input": 0.27, + "output": 1, + "cache_read": 0.21600000000000003 } }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "llama-prompt-guard-2-22m", + "name": "Meta Llama Prompt Guard 2 22M", + "display_name": "Meta Llama Prompt Guard 2 22M", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.01, + "output": 0.01 } }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "claude-3.5-sonnet-v2", + "name": "Anthropic: Claude 3.5 Sonnet v2", + "display_name": "Anthropic: Claude 3.5 Sonnet v2", "modalities": { "input": [ "text", @@ -22791,63 +22859,62 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { "input": 2, - "output": 8, - "cache_read": 0.5 + "output": 8 } }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gemini-2.5-flash-lite", + "name": "Google Gemini 2.5 Flash Lite", + "display_name": "Google Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", @@ -22858,8 +22925,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -22867,32 +22934,34 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-07", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998, + "cache_write": 0.09999999999999999 } }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "claude-sonnet-4-5-20250929", + "name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -22901,18 +22970,21 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.05, - "output": 0.2 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "grok-3", + "name": "xAI Grok 3", + "display_name": "xAI Grok 3", "modalities": { "input": [ "text" @@ -22923,27 +22995,28 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.15, - "output": 0.6 + "input": 3, + "output": 15, + "cache_read": 0.75 } }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "mistral-small", + "name": "Mistral Small", + "display_name": "Mistral Small", "modalities": { "input": [ "text", @@ -22954,30 +23027,28 @@ ] }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-02", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 75, + "output": 200 } }, { - "id": "qwen/qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "kimi-k2-0711", + "name": "Kimi K2 (07/11)", + "display_name": "Kimi K2 (07/11)", "modalities": { "input": [ "text" @@ -22987,8 +23058,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -22996,19 +23067,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.5700000000000001, + "output": 2.3 } }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "chatgpt-4o-latest", + "name": "OpenAI ChatGPT-4o", + "display_name": "OpenAI ChatGPT-4o", "modalities": { "input": [ "text", @@ -23019,66 +23090,60 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-08", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 5, + "output": 20, + "cache_read": 2.5 } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-07", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.09999999999999999, + "output": 0.3 } }, { - "id": "deepseek-ai/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "kimi-k2-0905", + "name": "Kimi K2 (09/05)", + "display_name": "Kimi K2 (09/05)", "modalities": { "input": [ "text" @@ -23088,37 +23153,29 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-23", - "last_updated": "2025-01-23", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0.5, + "output": 2, + "cache_read": 0.39999999999999997 } - } - ] - }, - "google": { - "id": "google", - "name": "google", - "display_name": "google", - "doc": "https://ai.google.dev/gemini-api/docs/pricing", - "models": [ + }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "sonar-reasoning", + "name": "Perplexity Sonar Reasoning", + "display_name": "Perplexity Sonar Reasoning", "modalities": { "input": [ "text" @@ -23128,178 +23185,157 @@ ] }, "limit": { - "context": 2048, - "output": 3072 + "context": 127000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.15, - "output": 0 + "input": 1, + "output": 5 } }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "llama-3.3-70b-instruct", + "name": "Meta Llama 3.3 70B Instruct", + "display_name": "Meta Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16400 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 + "input": 0.13, + "output": 0.39 } }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1 Codex Mini", + "display_name": "OpenAI: GPT-5.1 Codex Mini", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 } }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 0.48, + "output": 2 } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "o3-mini", + "name": "OpenAI o3 Mini", + "display_name": "OpenAI o3 Mini", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2023-10", + "release_date": "2023-10-01", + "last_updated": "2023-10-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 } }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "claude-4.5-sonnet", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -23310,256 +23346,227 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 0, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 } }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "gpt-5.1", + "name": "OpenAI GPT-5.1", + "display_name": "OpenAI GPT-5.1", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 } }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "codex-mini-latest", + "name": "OpenAI Codex Mini Latest", + "display_name": "OpenAI Codex Mini Latest", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 1.5, + "output": 6, + "cache_read": 0.375 } }, { - "id": "gemini-2.5-flash-preview-tts", - "name": "Gemini 2.5 Flash Preview TTS", - "display_name": "Gemini 2.5 Flash Preview TTS", + "id": "gpt-5-nano", + "name": "OpenAI GPT-5 Nano", + "display_name": "OpenAI GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.5, - "output": 10 + "input": 0.049999999999999996, + "output": 0.39999999999999997, + "cache_read": 0.005 } }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.075, - "output": 0.3 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 } }, { - "id": "gemini-live-2.5-flash-preview-native-audio", - "name": "Gemini Live 2.5 Flash Preview Native Audio", - "display_name": "Gemini Live 2.5 Flash Preview Native Audio", + "id": "gpt-4o", + "name": "OpenAI GPT-4o", + "display_name": "OpenAI GPT-4o", "modalities": { "input": [ "text", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-09-18", + "knowledge": "2024-05", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 + "input": 2.5, + "output": 10, + "cache_read": 1.25 } }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "deepseek-tng-r1t2-chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 130000, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-07", + "release_date": "2025-07-02", + "last_updated": "2025-07-02", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.3, + "output": 1.2 } }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "claude-4.5-opus", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ "text", @@ -23570,129 +23577,106 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-11", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 5, + "output": 25, + "cache_read": 0.5000000000000001, + "cache_write": 6.25 } }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "gpt-4.1", + "name": "OpenAI GPT-4.1", + "display_name": "OpenAI GPT-4.1", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "gemini-live-2.5-flash", - "name": "Gemini Live 2.5 Flash", - "display_name": "Gemini Live 2.5 Flash", + "id": "sonar", + "name": "Perplexity Sonar", + "display_name": "Perplexity Sonar", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 + "input": 1, + "output": 1 } }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": "glm-4.6", + "name": "Zai GLM-4.6", + "display_name": "Zai GLM-4.6", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -23700,148 +23684,129 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025, - "input_audio": 0.3 + "input": 0.44999999999999996, + "output": 1.5 } }, { - "id": "gemini-2.5-flash-image-preview", - "name": "Gemini 2.5 Flash Image Preview", - "display_name": "Gemini 2.5 Flash Image Preview", + "id": "o4-mini", + "name": "OpenAI o4 Mini", + "display_name": "OpenAI o4 Mini", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 } }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09 2025", - "display_name": "Gemini 2.5 Flash Preview 09 2025", + "id": "qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking", + "display_name": "Qwen3 235B A22B Thinking", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 81920 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 0, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "output": 2.9000000000000004 } }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "knowledge": "2024-05", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.14, + "output": 0.14 } }, { - "id": "gemini-2.5-pro-preview-tts", - "name": "Gemini 2.5 Pro Preview TTS", - "display_name": "Gemini 2.5 Pro Preview TTS", + "id": "o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": false, @@ -23851,398 +23816,345 @@ "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1, - "output": 20 + "input": 15, + "output": 60, + "cache_read": 7.5 } }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "grok-3-mini", + "name": "xAI Grok 3 Mini", + "display_name": "xAI Grok 3 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 128, - "max": 32768 - } - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 } }, { - "id": "gemini-1.5-flash", - "name": "Gemini 1.5 Flash", - "display_name": "Gemini 1.5 Flash", + "id": "sonar-pro", + "name": "Perplexity Sonar Pro", + "display_name": "Perplexity Sonar Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.01875 + "input": 3, + "output": 15 } }, { - "id": "gemini-1.5-flash-8b", - "name": "Gemini 1.5 Flash-8B", - "display_name": "Gemini 1.5 Flash-8B", + "id": "gpt-5-mini", + "name": "OpenAI GPT-5 Mini", + "display_name": "OpenAI GPT-5 Mini", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-03", - "last_updated": "2024-10-03", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.0375, - "output": 0.15, - "cache_read": 0.01 + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 } }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09 2025", - "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.03, + "output": 0.13 } }, { - "id": "gemini-1.5-pro", - "name": "Gemini 1.5 Pro", - "display_name": "Gemini 1.5 Pro", + "id": "o1-mini", + "name": "OpenAI: o1-mini", + "display_name": "OpenAI: o1-mini", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-02-15", - "last_updated": "2024-02-15", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 5, - "cache_read": 0.3125 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 } }, { - "id": "gemini-2.0-flash-preview-image-generation", - "name": "Gemini 2.0 Flash Preview Image Generation", - "display_name": "Gemini 2.0 Flash Preview Image Generation", + "id": "claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "display_name": "Anthropic: Claude 3.7 Sonnet", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, - "attachment": true - } - ] - }, - "google-vertex": { - "id": "google-vertex", - "name": "Vertex", - "display_name": "Vertex", - "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", - "models": [ + "attachment": false, + "open_weights": false, + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + } + }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "claude-3-haiku-20240307", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 3072 + "context": 200000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2024-03", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 0.15, - "output": 0 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 } }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "o3-pro", + "name": "OpenAI o3 Pro", + "display_name": "OpenAI o3 Pro", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 20, + "output": 80 } }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "qwen2.5-coder-7b-fast", + "name": "Qwen2.5 Coder 7B fast", + "display_name": "Qwen2.5 Coder 7B fast", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-09", + "release_date": "2024-09-15", + "last_updated": "2024-09-15", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.03, + "output": 0.09 } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 } }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "gemini-2.5-pro", + "name": "Google Gemini 2.5 Pro", + "display_name": "Google Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -24258,183 +24170,162 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", + "knowledge": "2025-06", "release_date": "2025-06-17", "last_updated": "2025-06-17", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 1.25, + "output": 10, + "cache_read": 0.3125, + "cache_write": 1.25 } }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.049999999999999996, + "output": 0.09999999999999999 } }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16400 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 20, + "output": 40 } }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.075, - "output": 0.3 + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "gpt-oss-20b", + "name": "OpenAI GPT-OSS 20b", + "display_name": "OpenAI GPT-OSS 20b", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.049999999999999996, + "output": 0.19999999999999998 } }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "gpt-oss-120b", + "name": "OpenAI GPT-OSS 120b", + "display_name": "OpenAI GPT-OSS 120b", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -24442,185 +24333,163 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.04, + "output": 0.16 } }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.7999999999999999, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 } }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": "gpt-5-chat-latest", + "name": "OpenAI GPT-5 Chat Latest", + "display_name": "OpenAI GPT-5 Chat Latest", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-09", + "release_date": "2024-09-30", + "last_updated": "2024-09-30", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 } }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09-25", - "display_name": "Gemini 2.5 Flash Preview 09-25", + "id": "gpt-4o-mini", + "name": "OpenAI GPT-4o-mini", + "display_name": "OpenAI GPT-4o-mini", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 } }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "gemma2-9b-it", + "name": "Google Gemma 2", + "display_name": "Google Gemma 2", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "knowledge": "2024-06", + "release_date": "2024-06-25", + "last_updated": "2024-06-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.01, + "output": 0.03 } }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -24628,137 +24497,132 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 } }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "sonar-reasoning-pro", + "name": "Perplexity Sonar Reasoning Pro", + "display_name": "Perplexity Sonar Reasoning Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 2, + "output": 8 } - } - ] - }, - "cloudflare-workers-ai": { - "id": "cloudflare-workers-ai", - "name": "Cloudflare Workers AI", - "display_name": "Cloudflare Workers AI", - "doc": "https://developers.cloudflare.com/workers-ai/models/", - "models": [ + }, { - "id": "mistral-7b-instruct-v0.1-awq", - "name": "@hf/thebloke/mistral-7b-instruct-v0.1-awq", - "display_name": "@hf/thebloke/mistral-7b-instruct-v0.1-awq", + "id": "gpt-5", + "name": "OpenAI GPT-5", + "display_name": "OpenAI GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-09-27", - "last_updated": "2023-11-09", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 } }, { - "id": "aura-1", - "name": "@cf/deepgram/aura-1", - "display_name": "@cf/deepgram/aura-1", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 256000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-27", - "last_updated": "2025-07-07", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.015, - "output": 0.015 + "input": 0.3, + "output": 1.5 } }, { - "id": "mistral-7b-instruct-v0.2", - "name": "@hf/mistral/mistral-7b-instruct-v0.2", - "display_name": "@hf/mistral/mistral-7b-instruct-v0.2", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 3072, - "output": 3072 + "context": 41000, + "output": 41000 }, "temperature": true, "tool_call": true, @@ -24766,18 +24630,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-12-11", - "last_updated": "2025-07-24", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0, - "output": 0 + "input": 0.08, + "output": 0.29 } }, { - "id": "tinyllama-1.1b-chat-v1.0", - "name": "@cf/tinyllama/tinyllama-1.1b-chat-v1.0", - "display_name": "@cf/tinyllama/tinyllama-1.1b-chat-v1.0", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -24787,8 +24652,8 @@ ] }, "limit": { - "context": 2048, - "output": 2048 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -24796,29 +24661,32 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-12-30", - "last_updated": "2024-03-17", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 0.41 } }, { - "id": "qwen1.5-0.5b-chat", - "name": "@cf/qwen/qwen1.5-0.5b-chat", - "display_name": "@cf/qwen/qwen1.5-0.5b-chat", + "id": "grok-4-1-fast-non-reasoning", + "name": "xAI Grok 4.1 Fast Non-Reasoning", + "display_name": "xAI Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -24826,18 +24694,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-01-31", - "last_updated": "2024-04-30", + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0, - "output": 0 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 } }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "@cf/meta/llama-3.2-11b-vision-instruct", - "display_name": "@cf/meta/llama-3.2-11b-vision-instruct", + "id": "gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ "text" @@ -24848,26 +24718,27 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-12-04", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.049, - "output": 0.68 + "input": 15, + "output": 120 } }, { - "id": "llama-2-13b-chat-awq", - "name": "@hf/thebloke/llama-2-13b-chat-awq", - "display_name": "@hf/thebloke/llama-2-13b-chat-awq", + "id": "llama-3.3-70b-versatile", + "name": "Meta Llama 3.3 70B Versatile", + "display_name": "Meta Llama 3.3 70B Versatile", "modalities": { "input": [ "text" @@ -24877,8 +24748,8 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32678 }, "temperature": true, "tool_call": true, @@ -24886,18 +24757,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-09-19", - "last_updated": "2023-11-09", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0 + "input": 0.59, + "output": 0.7899999999999999 } }, { - "id": "llama-3.1-8b-instruct-fp8", - "name": "@cf/meta/llama-3.1-8b-instruct-fp8", - "display_name": "@cf/meta/llama-3.1-8b-instruct-fp8", + "id": "mistral-large-2411", + "name": "Mistral-Large", + "display_name": "Mistral-Large", "modalities": { "input": [ "text" @@ -24907,8 +24779,8 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -24916,179 +24788,198 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2024-07-25", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0.15, - "output": 0.29 + "input": 2, + "output": 6 } }, { - "id": "whisper", - "name": "@cf/openai/whisper", - "display_name": "@cf/openai/whisper", + "id": "claude-opus-4-1-20250805", + "name": "Anthropic: Claude Opus 4.1 (20250805)", + "display_name": "Anthropic: Claude Opus 4.1 (20250805)", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 200000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2024-08-12", + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.00045, - "output": 0.00045 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "stable-diffusion-xl-base-1.0", - "name": "@cf/stabilityai/stable-diffusion-xl-base-1.0", - "display_name": "@cf/stabilityai/stable-diffusion-xl-base-1.0", + "id": "ernie-4.5-21b-a3b-thinking", + "name": "Baidu Ernie 4.5 21B A3B Thinking", + "display_name": "Baidu Ernie 4.5 21B A3B Thinking", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 128000, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2023-07-25", - "last_updated": "2023-10-30", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 0, - "output": 0 + "input": 0.07, + "output": 0.28 } }, { - "id": "llama-2-7b-chat-fp16", - "name": "@cf/meta/llama-2-7b-chat-fp16", - "display_name": "@cf/meta/llama-2-7b-chat-fp16", + "id": "gpt-5.1-chat-latest", + "name": "OpenAI GPT-5.1 Chat", + "display_name": "OpenAI GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-07-26", - "last_updated": "2023-07-26", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.56, - "output": 6.67 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 } }, { - "id": "resnet-50", - "name": "@cf/microsoft/resnet-50", - "display_name": "@cf/microsoft/resnet-50", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 131072, + "output": 40960 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2022-03-16", - "last_updated": "2024-02-13", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.0000025, - "output": 0 + "input": 0.29, + "output": 0.59 } }, { - "id": "stable-diffusion-v1-5-inpainting", - "name": "@cf/runwayml/stable-diffusion-v1-5-inpainting", - "display_name": "@cf/runwayml/stable-diffusion-v1-5-inpainting", + "id": "claude-haiku-4-5-20251001", + "name": "Anthropic: Claude 4.5 Haiku (20251001)", + "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 200000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "open_weights": false, + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 } }, { - "id": "sqlcoder-7b-2", - "name": "@cf/defog/sqlcoder-7b-2", - "display_name": "@cf/defog/sqlcoder-7b-2", + "id": "llama-4-scout", + "name": "Meta Llama 4 Scout 17B 16E", + "display_name": "Meta Llama 4 Scout 17B 16E", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 10000, - "output": 10000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -25096,18 +24987,28 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-05", - "last_updated": "2024-02-12", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.08, + "output": 0.3 } - }, + } + ] + }, + "opencode": { + "id": "opencode", + "name": "OpenCode Zen", + "display_name": "OpenCode Zen", + "api": "https://opencode.ai/zen/v1", + "doc": "https://opencode.ai/docs/zen", + "models": [ { - "id": "llama-3-8b-instruct", - "name": "@cf/meta/llama-3-8b-instruct", - "display_name": "@cf/meta/llama-3-8b-instruct", + "id": "qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ "text" @@ -25117,8 +25018,8 @@ ] }, "limit": { - "context": 7968, - "output": 7968 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -25127,47 +25028,54 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2025-06-19", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.28, - "output": 0.83 + "input": 0.45, + "output": 1.8 } }, { - "id": "llama-2-7b-chat-hf-lora", - "name": "@cf/meta-llama/llama-2-7b-chat-hf-lora", - "display_name": "@cf/meta-llama/llama-2-7b-chat-hf-lora", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-07-13", - "last_updated": "2024-04-17", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "llama-3.1-8b-instruct", - "name": "@cf/meta/llama-3.1-8b-instruct", - "display_name": "@cf/meta/llama-3.1-8b-instruct", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -25177,8 +25085,8 @@ ] }, "limit": { - "context": 7968, - "output": 7968 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -25187,167 +25095,209 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-09-25", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.28, - "output": 0.83 + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 } }, { - "id": "openchat-3.5-0106", - "name": "@cf/openchat/openchat-3.5-0106", - "display_name": "@cf/openchat/openchat-3.5-0106", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-01-07", - "last_updated": "2024-05-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0, - "output": 0 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 } }, { - "id": "openhermes-2.5-mistral-7b-awq", - "name": "@hf/thebloke/openhermes-2.5-mistral-7b-awq", - "display_name": "@hf/thebloke/openhermes-2.5-mistral-7b-awq", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-02", - "last_updated": "2023-11-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "lucid-origin", - "name": "@cf/leonardo/lucid-origin", - "display_name": "@cf/leonardo/lucid-origin", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-08-05", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.007, - "output": 0.007 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 } }, { - "id": "bart-large-cnn", - "name": "@cf/facebook/bart-large-cnn", - "display_name": "@cf/facebook/bart-large-cnn", + "id": "gemini-3-pro", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2022-03-02", - "last_updated": "2024-02-13", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } } }, { - "id": "flux-1-schnell", - "name": "@cf/black-forest-labs/flux-1-schnell", - "display_name": "@cf/black-forest-labs/flux-1-schnell", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 2048, - "output": 0 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-31", - "last_updated": "2024-08-16", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.000053, - "output": 0.00011 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } } }, { - "id": "deepseek-r1-distill-qwen-32b", - "name": "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", - "display_name": "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", + "id": "alpha-gd4", + "name": "Alpha GD4", + "display_name": "Alpha GD4", "modalities": { "input": [ "text" @@ -25357,8 +25307,8 @@ ] }, "limit": { - "context": 80000, - "output": 80000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -25368,17 +25318,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-02-24", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { "input": 0.5, - "output": 4.88 + "output": 2, + "cache_read": 0.15 } }, { - "id": "gemma-2b-it-lora", - "name": "@cf/google/gemma-2b-it-lora", - "display_name": "@cf/google/gemma-2b-it-lora", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -25388,57 +25340,65 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-04-02", - "last_updated": "2024-04-02", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 } }, { - "id": "una-cybertron-7b-v2-bf16", - "name": "@cf/fblgit/una-cybertron-7b-v2-bf16", - "display_name": "@cf/fblgit/una-cybertron-7b-v2-bf16", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 15000, - "output": 15000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-02", - "last_updated": "2024-03-08", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0, - "output": 0 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 } }, { - "id": "m2m100-1.2b", - "name": "@cf/meta/m2m100-1.2b", - "display_name": "@cf/meta/m2m100-1.2b", + "id": "alpha-minimax-m2", + "name": "MiniMax M2 (alpha)", + "display_name": "MiniMax M2 (alpha)", "modalities": { "input": [ "text" @@ -25448,147 +25408,166 @@ ] }, "limit": { - "context": 0, - "output": 0 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2022-03-02", - "last_updated": "2023-11-16", + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.34, - "output": 0.34 + "input": 0.3, + "output": 1.2 } }, { - "id": "llama-3.2-3b-instruct", - "name": "@cf/meta/llama-3.2-3b-instruct", - "display_name": "@cf/meta/llama-3.2-3b-instruct", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-10-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.051, - "output": 0.34 + "input": 0, + "output": 0, + "cache_read": 0 } }, { - "id": "qwen2.5-coder-32b-instruct", - "name": "@cf/qwen/qwen2.5-coder-32b-instruct", - "display_name": "@cf/qwen/qwen2.5-coder-32b-instruct", + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-06", - "last_updated": "2025-01-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.66, - "output": 1 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 } }, { - "id": "stable-diffusion-v1-5-img2img", - "name": "@cf/runwayml/stable-diffusion-v1-5-img2img", - "display_name": "@cf/runwayml/stable-diffusion-v1-5-img2img", + "id": "big-pickle", + "name": "Big Pickle", + "display_name": "Big Pickle", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 200000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-10-17", + "last_updated": "2025-10-17", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 } }, { - "id": "gemma-7b-it-lora", - "name": "@cf/google/gemma-7b-it-lora", - "display_name": "@cf/google/gemma-7b-it-lora", + "id": "claude-3-5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 3500, - "output": 3500 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-02", - "last_updated": "2024-04-02", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0, - "output": 0 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 } }, { - "id": "qwen1.5-14b-chat-awq", - "name": "@cf/qwen/qwen1.5-14b-chat-awq", - "display_name": "@cf/qwen/qwen1.5-14b-chat-awq", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -25598,27 +25577,30 @@ ] }, "limit": { - "context": 7500, - "output": 7500 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-02-03", - "last_updated": "2024-04-30", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 } }, { - "id": "qwen1.5-1.8b-chat", - "name": "@cf/qwen/qwen1.5-1.8b-chat", - "display_name": "@cf/qwen/qwen1.5-1.8b-chat", + "id": "grok-code", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -25628,147 +25610,184 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2024-04-30", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-20", + "last_updated": "2025-08-20", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 } }, { - "id": "mistral-small-3.1-24b-instruct", - "name": "@cf/mistralai/mistral-small-3.1-24b-instruct", - "display_name": "@cf/mistralai/mistral-small-3.1-24b-instruct", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-11", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0.35, - "output": 0.56 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "gemma-7b-it", - "name": "@hf/google/gemma-7b-it", - "display_name": "@hf/google/gemma-7b-it", + "id": "alpha-doubao-seed-code", + "name": "Doubao Seed Code (alpha)", + "display_name": "Doubao Seed Code (alpha)", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-02-13", - "last_updated": "2024-08-14", + "knowledge": "2024-10", + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 } }, { - "id": "llamaguard-7b-awq", - "name": "@hf/thebloke/llamaguard-7b-awq", - "display_name": "@hf/thebloke/llamaguard-7b-awq", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } } }, { - "id": "hermes-2-pro-mistral-7b", - "name": "@hf/nousresearch/hermes-2-pro-mistral-7b", - "display_name": "@hf/nousresearch/hermes-2-pro-mistral-7b", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-11", - "last_updated": "2024-09-08", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 } - }, + } + ] + }, + "fastrouter": { + "id": "fastrouter", + "name": "FastRouter", + "display_name": "FastRouter", + "api": "https://go.fastrouter.ai/api/v1", + "doc": "https://fastrouter.ai/models", + "models": [ { - "id": "falcon-7b-instruct", - "name": "@cf/tiiuae/falcon-7b-instruct", - "display_name": "@cf/tiiuae/falcon-7b-instruct", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -25778,8 +25797,8 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -25788,17 +25807,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2023-04-25", - "last_updated": "2024-10-12", + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0, - "output": 0 + "input": 0.55, + "output": 2.2 } }, { - "id": "llama-3.3-70b-instruct-fp8-fast", - "name": "@cf/meta/llama-3.3-70b-instruct-fp8-fast", - "display_name": "@cf/meta/llama-3.3-70b-instruct-fp8-fast", + "id": "x-ai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" @@ -25808,177 +25828,202 @@ ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.29, - "output": 2.25 + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 15 } }, { - "id": "llama-3-8b-instruct-awq", - "name": "@cf/meta/llama-3-8b-instruct-awq", - "display_name": "@cf/meta/llama-3-8b-instruct-awq", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-05-09", - "last_updated": "2024-05-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.12, - "output": 0.27 + "input": 0.3, + "output": 2.5, + "cache_read": 0.0375 } }, { - "id": "phoenix-1.0", - "name": "@cf/leonardo/phoenix-1.0", - "display_name": "@cf/leonardo/phoenix-1.0", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.0058, - "output": 0.0058 + "input": 1.25, + "output": 10, + "cache_read": 0.31 } }, { - "id": "phi-2", - "name": "@cf/microsoft/phi-2", - "display_name": "@cf/microsoft/phi-2", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 2048 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-13", - "last_updated": "2024-04-29", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 } }, { - "id": "dreamshaper-8-lcm", - "name": "@cf/lykon/dreamshaper-8-lcm", - "display_name": "@cf/lykon/dreamshaper-8-lcm", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 1047576, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2023-12-06", - "last_updated": "2023-12-07", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "discolm-german-7b-v1-awq", - "name": "@cf/thebloke/discolm-german-7b-v1-awq", - "display_name": "@cf/thebloke/discolm-german-7b-v1-awq", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-01-18", - "last_updated": "2024-01-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.025 } }, { - "id": "llama-2-7b-chat-int8", - "name": "@cf/meta/llama-2-7b-chat-int8", - "display_name": "@cf/meta/llama-2-7b-chat-int8", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -25988,27 +26033,28 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-09-25", - "last_updated": "2023-09-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.556, - "output": 6.667 + "input": 0.05, + "output": 0.2 } }, { - "id": "llama-3.2-1b-instruct", - "name": "@cf/meta/llama-3.2-1b-instruct", - "display_name": "@cf/meta/llama-3.2-1b-instruct", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -26018,57 +26064,62 @@ ] }, "limit": { - "context": 60000, - "output": 60000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-10-24", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.027, - "output": 0.2 + "input": 0.15, + "output": 0.6 } }, { - "id": "whisper-large-v3-turbo", - "name": "@cf/openai/whisper-large-v3-turbo", - "display_name": "@cf/openai/whisper-large-v3-turbo", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 400000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.00051, - "output": 0.00051 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "@cf/meta/llama-4-scout-17b-16e-instruct", - "display_name": "@cf/meta/llama-4-scout-17b-16e-instruct", + "id": "qwen/qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ "text" @@ -26078,8 +26129,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -26088,77 +26139,90 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-02", - "last_updated": "2025-05-23", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.27, - "output": 0.85 + "input": 0.3, + "output": 1.2 } }, { - "id": "starling-lm-7b-beta", - "name": "@hf/nexusflow/starling-lm-7b-beta", - "display_name": "@hf/nexusflow/starling-lm-7b-beta", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-19", - "last_updated": "2024-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "deepseek-coder-6.7b-base-awq", - "name": "@hf/thebloke/deepseek-coder-6.7b-base-awq", - "display_name": "@hf/thebloke/deepseek-coder-6.7b-base-awq", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-05", - "last_updated": "2023-11-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "gemma-3-12b-it", - "name": "@cf/google/gemma-3-12b-it", - "display_name": "@cf/google/gemma-3-12b-it", + "id": "deepseek-ai/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -26168,27 +26232,37 @@ ] }, "limit": { - "context": 80000, - "output": 80000 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-21", + "knowledge": "2024-10", + "release_date": "2025-01-23", + "last_updated": "2025-01-23", "cost": { - "input": 0.35, - "output": 0.56 + "input": 0.03, + "output": 0.14 } - }, + } + ] + }, + "google": { + "id": "google", + "name": "google", + "display_name": "google", + "doc": "https://ai.google.dev/gemini-api/docs/pricing", + "models": [ { - "id": "llama-guard-3-8b", - "name": "@cf/meta/llama-guard-3-8b", - "display_name": "@cf/meta/llama-guard-3-8b", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -26198,8 +26272,41 @@ ] }, "limit": { - "context": 0, + "context": 2048, + "output": 3072 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.15, "output": 0 + } + }, + { + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -26207,59 +26314,266 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-22", - "last_updated": "2024-10-11", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.48, - "output": 0.03 + "input": 0.3, + "output": 30, + "cache_read": 0.075 } }, { - "id": "neural-chat-7b-v3-1-awq", - "name": "@hf/thebloke/neural-chat-7b-v3-1-awq", - "display_name": "@hf/thebloke/neural-chat-7b-v3-1-awq", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", "modalities": { "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } + }, + { + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-15", - "last_updated": "2023-11-17", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 } }, { - "id": "whisper-tiny-en", - "name": "@cf/openai/whisper-tiny-en", - "display_name": "@cf/openai/whisper-tiny-en", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "audio" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + } + }, + { + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 + } + }, + { + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 + } + }, + { + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } + }, + { + "id": "gemini-2.5-flash-preview-tts", + "name": "Gemini 2.5 Flash Preview TTS", + "display_name": "Gemini 2.5 Flash Preview TTS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 8000, + "output": 16000 }, "temperature": false, "tool_call": false, @@ -26267,172 +26581,7154 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2022-09-26", - "last_updated": "2024-01-22", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 10 + } + }, + { + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "search": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.075, + "output": 0.3 + } + }, + { + "id": "gemini-live-2.5-flash-preview-native-audio", + "name": "Gemini Live 2.5 Flash Preview Native Audio", + "display_name": "Gemini Live 2.5 Flash Preview Native Audio", + "modalities": { + "input": [ + "text", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 131072, + "output": 65536 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-09-18", + "cost": { + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 + } + }, + { + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } + }, + { + "id": "gemini-live-2.5-flash", + "name": "Gemini Live 2.5 Flash", + "display_name": "Gemini Live 2.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 128000, + "output": 8000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", + "cost": { + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 + } + }, + { + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "input_audio": 0.3 + } + }, + { + "id": "gemini-2.5-flash-image-preview", + "name": "Gemini 2.5 Flash Image Preview", + "display_name": "Gemini 2.5 Flash Image Preview", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.3, + "output": 30, + "cache_read": 0.075 + } + }, + { + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09 2025", + "display_name": "Gemini 2.5 Flash Preview 09 2025", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 + } + }, + { + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } + }, + { + "id": "gemini-2.5-pro-preview-tts", + "name": "Gemini 2.5 Pro Preview TTS", + "display_name": "Gemini 2.5 Pro Preview TTS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 8000, + "output": 16000 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", + "cost": { + "input": 1, + "output": 20 + } + }, + { + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": -1, + "min": 128, + "max": 32768 + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } + }, + { + "id": "gemini-1.5-flash", + "name": "Gemini 1.5 Flash", + "display_name": "Gemini 1.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", + "cost": { + "input": 0.075, + "output": 0.3, + "cache_read": 0.01875 + } + }, + { + "id": "gemini-1.5-flash-8b", + "name": "Gemini 1.5 Flash-8B", + "display_name": "Gemini 1.5 Flash-8B", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-03", + "last_updated": "2024-10-03", + "cost": { + "input": 0.0375, + "output": 0.15, + "cache_read": 0.01 + } + }, + { + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09 2025", + "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "gemini-1.5-pro", + "name": "Gemini 1.5 Pro", + "display_name": "Gemini 1.5 Pro", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-02-15", + "last_updated": "2024-02-15", + "cost": { + "input": 1.25, + "output": 5, + "cache_read": 0.3125 + } + }, + { + "id": "gemini-2.0-flash-preview-image-generation", + "name": "Gemini 2.0 Flash Preview Image Generation", + "display_name": "Gemini 2.0 Flash Preview Image Generation", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "search": { + "supported": false + }, + "attachment": true + } + ] + }, + "google-vertex": { + "id": "google-vertex", + "name": "Vertex", + "display_name": "Vertex", + "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", + "models": [ + { + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2048, + "output": 3072 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.15, + "output": 0 + } + }, + { + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } + }, + { + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + } + }, + { + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + } + }, + { + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + } + }, + { + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } + }, + { + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.075, + "output": 0.3 + } + }, + { + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } + }, + { + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 65536, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09-25", + "display_name": "Gemini 2.5 Flash Preview 09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + } + }, + { + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } + }, + { + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } + }, + { + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } + }, + { + "id": "openai/gpt-oss-120b-maas", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.09, + "output": 0.36 + } + }, + { + "id": "openai/gpt-oss-20b-maas", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.07, + "output": 0.25 + } + } + ] + }, + "cloudflare-workers-ai": { + "id": "cloudflare-workers-ai", + "name": "Cloudflare Workers AI", + "display_name": "Cloudflare Workers AI", + "doc": "https://developers.cloudflare.com/workers-ai/models/", + "models": [ + { + "id": "mistral-7b-instruct-v0.1-awq", + "name": "@hf/thebloke/mistral-7b-instruct-v0.1-awq", + "display_name": "@hf/thebloke/mistral-7b-instruct-v0.1-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-09-27", + "last_updated": "2023-11-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "aura-1", + "name": "@cf/deepgram/aura-1", + "display_name": "@cf/deepgram/aura-1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-27", + "last_updated": "2025-07-07", + "cost": { + "input": 0.015, + "output": 0.015 + } + }, + { + "id": "mistral-7b-instruct-v0.2", + "name": "@hf/mistral/mistral-7b-instruct-v0.2", + "display_name": "@hf/mistral/mistral-7b-instruct-v0.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 3072, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-12-11", + "last_updated": "2025-07-24", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "tinyllama-1.1b-chat-v1.0", + "name": "@cf/tinyllama/tinyllama-1.1b-chat-v1.0", + "display_name": "@cf/tinyllama/tinyllama-1.1b-chat-v1.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2048, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-12-30", + "last_updated": "2024-03-17", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "qwen1.5-0.5b-chat", + "name": "@cf/qwen/qwen1.5-0.5b-chat", + "display_name": "@cf/qwen/qwen1.5-0.5b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-01-31", + "last_updated": "2024-04-30", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-3.2-11b-vision-instruct", + "name": "@cf/meta/llama-3.2-11b-vision-instruct", + "display_name": "@cf/meta/llama-3.2-11b-vision-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-12-04", + "cost": { + "input": 0.049, + "output": 0.68 + } + }, + { + "id": "llama-2-13b-chat-awq", + "name": "@hf/thebloke/llama-2-13b-chat-awq", + "display_name": "@hf/thebloke/llama-2-13b-chat-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-09-19", + "last_updated": "2023-11-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-3.1-8b-instruct-fp8", + "name": "@cf/meta/llama-3.1-8b-instruct-fp8", + "display_name": "@cf/meta/llama-3.1-8b-instruct-fp8", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-25", + "last_updated": "2024-07-25", + "cost": { + "input": 0.15, + "output": 0.29 + } + }, + { + "id": "whisper", + "name": "@cf/openai/whisper", + "display_name": "@cf/openai/whisper", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2024-08-12", + "cost": { + "input": 0.00045, + "output": 0.00045 + } + }, + { + "id": "stable-diffusion-xl-base-1.0", + "name": "@cf/stabilityai/stable-diffusion-xl-base-1.0", + "display_name": "@cf/stabilityai/stable-diffusion-xl-base-1.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-07-25", + "last_updated": "2023-10-30", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-2-7b-chat-fp16", + "name": "@cf/meta/llama-2-7b-chat-fp16", + "display_name": "@cf/meta/llama-2-7b-chat-fp16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-07-26", + "last_updated": "2023-07-26", + "cost": { + "input": 0.56, + "output": 6.67 + } + }, + { + "id": "resnet-50", + "name": "@cf/microsoft/resnet-50", + "display_name": "@cf/microsoft/resnet-50", + "modalities": { + "input": [ + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2022-03-16", + "last_updated": "2024-02-13", + "cost": { + "input": 0.0000025, + "output": 0 + } + }, + { + "id": "stable-diffusion-v1-5-inpainting", + "name": "@cf/runwayml/stable-diffusion-v1-5-inpainting", + "display_name": "@cf/runwayml/stable-diffusion-v1-5-inpainting", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-27", + "last_updated": "2024-02-27", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "sqlcoder-7b-2", + "name": "@cf/defog/sqlcoder-7b-2", + "display_name": "@cf/defog/sqlcoder-7b-2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 10000, + "output": 10000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-05", + "last_updated": "2024-02-12", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-3-8b-instruct", + "name": "@cf/meta/llama-3-8b-instruct", + "display_name": "@cf/meta/llama-3-8b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 7968, + "output": 7968 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-04-17", + "last_updated": "2025-06-19", + "cost": { + "input": 0.28, + "output": 0.83 + } + }, + { + "id": "llama-2-7b-chat-hf-lora", + "name": "@cf/meta-llama/llama-2-7b-chat-hf-lora", + "display_name": "@cf/meta-llama/llama-2-7b-chat-hf-lora", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-07-13", + "last_updated": "2024-04-17", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-3.1-8b-instruct", + "name": "@cf/meta/llama-3.1-8b-instruct", + "display_name": "@cf/meta/llama-3.1-8b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 7968, + "output": 7968 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-18", + "last_updated": "2024-09-25", + "cost": { + "input": 0.28, + "output": 0.83 + } + }, + { + "id": "openchat-3.5-0106", + "name": "@cf/openchat/openchat-3.5-0106", + "display_name": "@cf/openchat/openchat-3.5-0106", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-01-07", + "last_updated": "2024-05-18", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "openhermes-2.5-mistral-7b-awq", + "name": "@hf/thebloke/openhermes-2.5-mistral-7b-awq", + "display_name": "@hf/thebloke/openhermes-2.5-mistral-7b-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-02", + "last_updated": "2023-11-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "lucid-origin", + "name": "@cf/leonardo/lucid-origin", + "display_name": "@cf/leonardo/lucid-origin", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-25", + "last_updated": "2025-08-05", + "cost": { + "input": 0.007, + "output": 0.007 + } + }, + { + "id": "bart-large-cnn", + "name": "@cf/facebook/bart-large-cnn", + "display_name": "@cf/facebook/bart-large-cnn", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2022-03-02", + "last_updated": "2024-02-13", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "flux-1-schnell", + "name": "@cf/black-forest-labs/flux-1-schnell", + "display_name": "@cf/black-forest-labs/flux-1-schnell", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 2048, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-31", + "last_updated": "2024-08-16", + "cost": { + "input": 0.000053, + "output": 0.00011 + } + }, + { + "id": "deepseek-r1-distill-qwen-32b", + "name": "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", + "display_name": "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 80000, + "output": 80000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-02-24", + "cost": { + "input": 0.5, + "output": 4.88 + } + }, + { + "id": "gemma-2b-it-lora", + "name": "@cf/google/gemma-2b-it-lora", + "display_name": "@cf/google/gemma-2b-it-lora", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-04-02", + "last_updated": "2024-04-02", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "una-cybertron-7b-v2-bf16", + "name": "@cf/fblgit/una-cybertron-7b-v2-bf16", + "display_name": "@cf/fblgit/una-cybertron-7b-v2-bf16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 15000, + "output": 15000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-12-02", + "last_updated": "2024-03-08", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "gemma-sea-lion-v4-27b-it", + "name": "@cf/aisingapore/gemma-sea-lion-v4-27b-it", + "display_name": "@cf/aisingapore/gemma-sea-lion-v4-27b-it", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 0 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-23", + "last_updated": "2025-12-02", + "cost": { + "input": 0.35, + "output": 0.56 + } + }, + { + "id": "m2m100-1.2b", + "name": "@cf/meta/m2m100-1.2b", + "display_name": "@cf/meta/m2m100-1.2b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2022-03-02", + "last_updated": "2023-11-16", + "cost": { + "input": 0.34, + "output": 0.34 + } + }, + { + "id": "llama-3.2-3b-instruct", + "name": "@cf/meta/llama-3.2-3b-instruct", + "display_name": "@cf/meta/llama-3.2-3b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-10-24", + "cost": { + "input": 0.051, + "output": 0.34 + } + }, + { + "id": "qwen2.5-coder-32b-instruct", + "name": "@cf/qwen/qwen2.5-coder-32b-instruct", + "display_name": "@cf/qwen/qwen2.5-coder-32b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-11-06", + "last_updated": "2025-01-12", + "cost": { + "input": 0.66, + "output": 1 + } + }, + { + "id": "stable-diffusion-v1-5-img2img", + "name": "@cf/runwayml/stable-diffusion-v1-5-img2img", + "display_name": "@cf/runwayml/stable-diffusion-v1-5-img2img", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-27", + "last_updated": "2024-02-27", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "gemma-7b-it-lora", + "name": "@cf/google/gemma-7b-it-lora", + "display_name": "@cf/google/gemma-7b-it-lora", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 3500, + "output": 3500 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-04-02", + "last_updated": "2024-04-02", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "qwen1.5-14b-chat-awq", + "name": "@cf/qwen/qwen1.5-14b-chat-awq", + "display_name": "@cf/qwen/qwen1.5-14b-chat-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 7500, + "output": 7500 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-03", + "last_updated": "2024-04-30", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "qwen1.5-1.8b-chat", + "name": "@cf/qwen/qwen1.5-1.8b-chat", + "display_name": "@cf/qwen/qwen1.5-1.8b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-01-30", + "last_updated": "2024-04-30", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "mistral-small-3.1-24b-instruct", + "name": "@cf/mistralai/mistral-small-3.1-24b-instruct", + "display_name": "@cf/mistralai/mistral-small-3.1-24b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-03-11", + "last_updated": "2025-07-28", + "cost": { + "input": 0.35, + "output": 0.56 + } + }, + { + "id": "gemma-7b-it", + "name": "@hf/google/gemma-7b-it", + "display_name": "@hf/google/gemma-7b-it", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-13", + "last_updated": "2024-08-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "qwen3-30b-a3b-fp8", + "name": "@cf/qwen/qwen3-30b-a3b-fp8", + "display_name": "@cf/qwen/qwen3-30b-a3b-fp8", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 0 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04-30", + "last_updated": "2025-12-02", + "cost": { + "input": 0.051, + "output": 0.34 + } + }, + { + "id": "llamaguard-7b-awq", + "name": "@hf/thebloke/llamaguard-7b-awq", + "display_name": "@hf/thebloke/llamaguard-7b-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "hermes-2-pro-mistral-7b", + "name": "@hf/nousresearch/hermes-2-pro-mistral-7b", + "display_name": "@hf/nousresearch/hermes-2-pro-mistral-7b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 24000, + "output": 24000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-03-11", + "last_updated": "2024-09-08", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "granite-4.0-h-micro", + "name": "@cf/ibm-granite/granite-4.0-h-micro", + "display_name": "@cf/ibm-granite/granite-4.0-h-micro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 0 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-07", + "last_updated": "2025-12-02", + "cost": { + "input": 0.017, + "output": 0.11 + } + }, + { + "id": "falcon-7b-instruct", + "name": "@cf/tiiuae/falcon-7b-instruct", + "display_name": "@cf/tiiuae/falcon-7b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-04-25", + "last_updated": "2024-10-12", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-3.3-70b-instruct-fp8-fast", + "name": "@cf/meta/llama-3.3-70b-instruct-fp8-fast", + "display_name": "@cf/meta/llama-3.3-70b-instruct-fp8-fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 24000, + "output": 24000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.29, + "output": 2.25 + } + }, + { + "id": "llama-3-8b-instruct-awq", + "name": "@cf/meta/llama-3-8b-instruct-awq", + "display_name": "@cf/meta/llama-3-8b-instruct-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-05-09", + "last_updated": "2024-05-09", + "cost": { + "input": 0.12, + "output": 0.27 + } + }, + { + "id": "phoenix-1.0", + "name": "@cf/leonardo/phoenix-1.0", + "display_name": "@cf/leonardo/phoenix-1.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", + "cost": { + "input": 0.0058, + "output": 0.0058 + } + }, + { + "id": "phi-2", + "name": "@cf/microsoft/phi-2", + "display_name": "@cf/microsoft/phi-2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2048, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-12-13", + "last_updated": "2024-04-29", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "dreamshaper-8-lcm", + "name": "@cf/lykon/dreamshaper-8-lcm", + "display_name": "@cf/lykon/dreamshaper-8-lcm", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2023-12-06", + "last_updated": "2023-12-07", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "discolm-german-7b-v1-awq", + "name": "@cf/thebloke/discolm-german-7b-v1-awq", + "display_name": "@cf/thebloke/discolm-german-7b-v1-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-01-18", + "last_updated": "2024-01-24", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-2-7b-chat-int8", + "name": "@cf/meta/llama-2-7b-chat-int8", + "display_name": "@cf/meta/llama-2-7b-chat-int8", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-09-25", + "last_updated": "2023-09-25", + "cost": { + "input": 0.556, + "output": 6.667 + } + }, + { + "id": "llama-3.2-1b-instruct", + "name": "@cf/meta/llama-3.2-1b-instruct", + "display_name": "@cf/meta/llama-3.2-1b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 60000, + "output": 60000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-10-24", + "cost": { + "input": 0.027, + "output": 0.2 + } + }, + { + "id": "whisper-large-v3-turbo", + "name": "@cf/openai/whisper-large-v3-turbo", + "display_name": "@cf/openai/whisper-large-v3-turbo", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-10-01", + "last_updated": "2024-10-04", + "cost": { + "input": 0.00051, + "output": 0.00051 + } + }, + { + "id": "llama-4-scout-17b-16e-instruct", + "name": "@cf/meta/llama-4-scout-17b-16e-instruct", + "display_name": "@cf/meta/llama-4-scout-17b-16e-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04-02", + "last_updated": "2025-05-23", + "cost": { + "input": 0.27, + "output": 0.85 + } + }, + { + "id": "starling-lm-7b-beta", + "name": "@hf/nexusflow/starling-lm-7b-beta", + "display_name": "@hf/nexusflow/starling-lm-7b-beta", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-03-19", + "last_updated": "2024-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "deepseek-coder-6.7b-base-awq", + "name": "@hf/thebloke/deepseek-coder-6.7b-base-awq", + "display_name": "@hf/thebloke/deepseek-coder-6.7b-base-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-05", + "last_updated": "2023-11-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "gemma-3-12b-it", + "name": "@cf/google/gemma-3-12b-it", + "display_name": "@cf/google/gemma-3-12b-it", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 80000, + "output": 80000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-21", + "cost": { + "input": 0.35, + "output": 0.56 + } + }, + { + "id": "llama-guard-3-8b", + "name": "@cf/meta/llama-guard-3-8b", + "display_name": "@cf/meta/llama-guard-3-8b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 0 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-22", + "last_updated": "2024-10-11", + "cost": { + "input": 0.48, + "output": 0.03 + } + }, + { + "id": "neural-chat-7b-v3-1-awq", + "name": "@hf/thebloke/neural-chat-7b-v3-1-awq", + "display_name": "@hf/thebloke/neural-chat-7b-v3-1-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-15", + "last_updated": "2023-11-17", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "whisper-tiny-en", + "name": "@cf/openai/whisper-tiny-en", + "display_name": "@cf/openai/whisper-tiny-en", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2022-09-26", + "last_updated": "2024-01-22", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "stable-diffusion-xl-lightning", + "name": "@cf/bytedance/stable-diffusion-xl-lightning", + "display_name": "@cf/bytedance/stable-diffusion-xl-lightning", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-20", + "last_updated": "2024-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "mistral-7b-instruct-v0.1", + "name": "@cf/mistral/mistral-7b-instruct-v0.1", + "display_name": "@cf/mistral/mistral-7b-instruct-v0.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2824, + "output": 2824 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-09-27", + "last_updated": "2025-07-24", + "cost": { + "input": 0.11, + "output": 0.19 + } + }, + { + "id": "llava-1.5-7b-hf", + "name": "@cf/llava-hf/llava-1.5-7b-hf", + "display_name": "@cf/llava-hf/llava-1.5-7b-hf", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2023-12-05", + "last_updated": "2025-06-06", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "gpt-oss-20b", + "name": "@cf/openai/gpt-oss-20b", + "display_name": "@cf/openai/gpt-oss-20b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-04", + "last_updated": "2025-08-14", + "cost": { + "input": 0.2, + "output": 0.3 + } + }, + { + "id": "deepseek-math-7b-instruct", + "name": "@cf/deepseek-ai/deepseek-math-7b-instruct", + "display_name": "@cf/deepseek-ai/deepseek-math-7b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-05", + "last_updated": "2024-02-06", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "gpt-oss-120b", + "name": "@cf/openai/gpt-oss-120b", + "display_name": "@cf/openai/gpt-oss-120b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-04", + "last_updated": "2025-08-14", + "cost": { + "input": 0.35, + "output": 0.75 + } + }, + { + "id": "melotts", + "name": "@cf/myshell-ai/melotts", + "display_name": "@cf/myshell-ai/melotts", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2024-07-19", + "last_updated": "2024-07-19", + "cost": { + "input": 0.0002, + "output": 0 + } + }, + { + "id": "qwen1.5-7b-chat-awq", + "name": "@cf/qwen/qwen1.5-7b-chat-awq", + "display_name": "@cf/qwen/qwen1.5-7b-chat-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 20000, + "output": 20000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-03", + "last_updated": "2024-04-30", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-3.1-8b-instruct-fast", + "name": "@cf/meta/llama-3.1-8b-instruct-fast", + "display_name": "@cf/meta/llama-3.1-8b-instruct-fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-18", + "last_updated": "2024-09-25", + "cost": { + "input": 0.045, + "output": 0.384 + } + }, + { + "id": "nova-3", + "name": "@cf/deepgram/nova-3", + "display_name": "@cf/deepgram/nova-3", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-05", + "last_updated": "2025-07-08", + "cost": { + "input": 0.0052, + "output": 0.0052 + } + }, + { + "id": "llama-3.1-70b-instruct", + "name": "@cf/meta/llama-3.1-70b-instruct", + "display_name": "@cf/meta/llama-3.1-70b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 24000, + "output": 24000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-12-15", + "cost": { + "input": 0.293, + "output": 2.253 + } + }, + { + "id": "qwq-32b", + "name": "@cf/qwen/qwq-32b", + "display_name": "@cf/qwen/qwq-32b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 24000, + "output": 24000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-11", + "cost": { + "input": 0.66, + "output": 1 + } + }, + { + "id": "zephyr-7b-beta-awq", + "name": "@hf/thebloke/zephyr-7b-beta-awq", + "display_name": "@hf/thebloke/zephyr-7b-beta-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-10-27", + "last_updated": "2023-11-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "deepseek-coder-6.7b-instruct-awq", + "name": "@hf/thebloke/deepseek-coder-6.7b-instruct-awq", + "display_name": "@hf/thebloke/deepseek-coder-6.7b-instruct-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-05", + "last_updated": "2023-11-13", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "llama-3.1-8b-instruct-awq", + "name": "@cf/meta/llama-3.1-8b-instruct-awq", + "display_name": "@cf/meta/llama-3.1-8b-instruct-awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-25", + "last_updated": "2024-07-25", + "cost": { + "input": 0.12, + "output": 0.27 + } + }, + { + "id": "mistral-7b-instruct-v0.2-lora", + "name": "@cf/mistral/mistral-7b-instruct-v0.2-lora", + "display_name": "@cf/mistral/mistral-7b-instruct-v0.2-lora", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 15000, + "output": 15000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-04-01", + "last_updated": "2024-04-01", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "uform-gen2-qwen-500m", + "name": "@cf/unum/uform-gen2-qwen-500m", + "display_name": "@cf/unum/uform-gen2-qwen-500m", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-02-15", + "last_updated": "2024-04-24", + "cost": { + "input": 0, + "output": 0 + } + } + ] + }, + "inception": { + "id": "inception", + "name": "Inception", + "display_name": "Inception", + "api": "https://api.inceptionlabs.ai/v1/", + "doc": "https://platform.inceptionlabs.ai/docs", + "models": [ + { + "id": "mercury-coder", + "name": "Mercury Coder", + "display_name": "Mercury Coder", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-02-26", + "last_updated": "2025-07-31", + "cost": { + "input": 0.25, + "output": 1, + "cache_read": 0.25, + "cache_write": 1 + } + }, + { + "id": "mercury", + "name": "Mercury", + "display_name": "Mercury", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-06-26", + "last_updated": "2025-07-31", + "cost": { + "input": 0.25, + "output": 1, + "cache_read": 0.25, + "cache_write": 1 + } + } + ] + }, + "cloudflare-ai-gateway": { + "id": "cloudflare-ai-gateway", + "name": "Cloudflare AI Gateway", + "display_name": "Cloudflare AI Gateway", + "api": "https://gateway.ai.cloudflare.com/v1/${CLOUDFLARE_ACCOUNT_ID}/${CLOUDFLARE_GATEWAY_ID}/compat/", + "doc": "https://developers.cloudflare.com/ai-gateway/", + "models": [ + { + "id": "workers-ai/aura-1", + "name": "aura 1", + "display_name": "aura 1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-3.2-11b-vision-instruct", + "name": "llama 3.2 11u vision instruct", + "display_name": "llama 3.2 11u vision instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/bge-m3", + "name": "uge m3", + "display_name": "uge m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-3.1-8b-instruct-fp8", + "name": "llama 3.1 8u instruct fp8", + "display_name": "llama 3.1 8u instruct fp8", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/whisper", + "name": "whisper", + "display_name": "whisper", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/smart-turn-v2", + "name": "smart turn v2", + "display_name": "smart turn v2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-2-7b-chat-fp16", + "name": "llama 2 7u chat fp16", + "display_name": "llama 2 7u chat fp16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 6.67 + } + }, + { + "id": "workers-ai/llama-3-8b-instruct", + "name": "llama 3 8u instruct", + "display_name": "llama 3 8u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-3.1-8b-instruct", + "name": "llama 3.1 8u instruct", + "display_name": "llama 3.1 8u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/bge-base-en-v1.5", + "name": "uge uase en v1.5", + "display_name": "uge uase en v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/bart-large-cnn", + "name": "uart large cnn", + "display_name": "uart large cnn", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-09", + "last_updated": "2025-04-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/deepseek-r1-distill-qwen-32b", + "name": "deepseek r1 distill qwen 32b", + "display_name": "deepseek r1 distill qwen 32b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 4.88 + } + }, + { + "id": "workers-ai/plamo-embedding-1b", + "name": "plamo emuedding 1b", + "display_name": "plamo emuedding 1b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/bge-large-en-v1.5", + "name": "uge large en v1.5", + "display_name": "uge large en v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/gemma-sea-lion-v4-27b-it", + "name": "gemma sea lion v4 27u it", + "display_name": "gemma sea lion v4 27u it", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/m2m100-1.2b", + "name": "m2m100 1.2b", + "display_name": "m2m100 1.2b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-3.2-3b-instruct", + "name": "llama 3.2 3u instruct", + "display_name": "llama 3.2 3u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/qwen2.5-coder-32b-instruct", + "name": "qwen2.5 coder 32u instruct", + "display_name": "qwen2.5 coder 32u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 0, + "output": 1 + } + }, + { + "id": "workers-ai/bge-reranker-base", + "name": "uge reranker uase", + "display_name": "uge reranker uase", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-09", + "last_updated": "2025-04-09", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/mistral-small-3.1-24b-instruct", + "name": "mistral small 3.1 24u instruct", + "display_name": "mistral small 3.1 24u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/aura-2-es", + "name": "aura 2 es", + "display_name": "aura 2 es", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/qwen3-30b-a3b-fp8", + "name": "qwen3 30u a3u fp8", + "display_name": "qwen3 30u a3u fp8", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/aura-2-en", + "name": "aura 2 en", + "display_name": "aura 2 en", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/granite-4.0-h-micro", + "name": "granite 4.0 h micro", + "display_name": "granite 4.0 h micro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-3.3-70b-instruct-fp8-fast", + "name": "llama 3.3 70u instruct fp8 fast", + "display_name": "llama 3.3 70u instruct fp8 fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 2.25 + } + }, + { + "id": "workers-ai/llama-3-8b-instruct-awq", + "name": "llama 3 8u instruct awq", + "display_name": "llama 3 8u instruct awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/qwen3-embedding-0.6b", + "name": "qwen3 emuedding 0.6b", + "display_name": "qwen3 emuedding 0.6b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-3.2-1b-instruct", + "name": "llama 3.2 1u instruct", + "display_name": "llama 3.2 1u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/whisper-large-v3-turbo", + "name": "whisper large v3 turuo", + "display_name": "whisper large v3 turuo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-4-scout-17b-16e-instruct", + "name": "llama 4 scout 17u 16e instruct", + "display_name": "llama 4 scout 17u 16e instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/gemma-3-12b-it", + "name": "gemma 3 12u it", + "display_name": "gemma 3 12u it", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-guard-3-8b", + "name": "llama guard 3 8b", + "display_name": "llama guard 3 8b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/mistral-7b-instruct-v0.1", + "name": "mistral 7u instruct v0.1", + "display_name": "mistral 7u instruct v0.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/gpt-oss-20b", + "name": "gpt oss 20b", + "display_name": "gpt oss 20b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/gpt-oss-120b", + "name": "gpt oss 120b", + "display_name": "gpt oss 120b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/bge-small-en-v1.5", + "name": "uge small en v1.5", + "display_name": "uge small en v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/melotts", + "name": "melotts", + "display_name": "melotts", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/nova-3", + "name": "nova 3", + "display_name": "nova 3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/qwq-32b", + "name": "qwq 32b", + "display_name": "qwq 32b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 0, + "output": 1 + } + }, + { + "id": "workers-ai/distilbert-sst-2-int8", + "name": "distiluert sst 2 int8", + "display_name": "distiluert sst 2 int8", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "workers-ai/llama-3.1-8b-instruct-awq", + "name": "llama 3.1 8u instruct awq", + "display_name": "llama 3.1 8u instruct awq", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "openai/gpt-4", + "name": "gpt 4", + "display_name": "gpt 4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 30, + "output": 60 + } + }, + { + "id": "openai/gpt-5.1-codex", + "name": "gpt 5.1 codex", + "display_name": "gpt 5.1 codex", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1.25, + "output": 10 + } + }, + { + "id": "openai/gpt-3.5-turbo", + "name": "gpt 3.5 turuo", + "display_name": "gpt 3.5 turuo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-02-10", + "last_updated": "2025-02-10", + "cost": { + "input": 0, + "output": 1.5 + } + }, + { + "id": "openai/gpt-4-turbo", + "name": "gpt 4 turuo", + "display_name": "gpt 4 turuo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 10, + "output": 30 + } + }, + { + "id": "openai/o1-preview", + "name": "o1 preview", + "display_name": "o1 preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "cost": { + "input": 15, + "output": 60 + } + }, + { + "id": "openai/o3-mini", + "name": "o3 mini", + "display_name": "o3 mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "cost": { + "input": 1.1, + "output": 4.4 + } + }, + { + "id": "openai/gpt-5.1", + "name": "gpt 5.1", + "display_name": "gpt 5.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1.25, + "output": 10 + } + }, + { + "id": "openai/gpt-4o", + "name": "gpt 4o", + "display_name": "gpt 4o", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-02-10", + "last_updated": "2025-02-10", + "cost": { + "input": 2.5, + "output": 10 + } + }, + { + "id": "openai/o4-mini", + "name": "o4 mini", + "display_name": "o4 mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4 + } + }, + { + "id": "openai/o1", + "name": "o1", + "display_name": "o1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-01-07", + "last_updated": "2025-01-07", + "cost": { + "input": 15, + "output": 60 + } + }, + { + "id": "openai/o1-mini", + "name": "o1 mini", + "display_name": "o1 mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-02-10", + "last_updated": "2025-02-10", + "cost": { + "input": 1.1, + "output": 4.4 + } + }, + { + "id": "openai/o3-pro", + "name": "o3 pro", + "display_name": "o3 pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06-11", + "last_updated": "2025-06-11", + "cost": { + "input": 20, + "output": 80 + } + }, + { + "id": "openai/o3", + "name": "o3", + "display_name": "o3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06-10", + "last_updated": "2025-06-10", + "cost": { + "input": 2, + "output": 8 + } + }, + { + "id": "openai/gpt-4o-mini", + "name": "gpt 4o mini", + "display_name": "gpt 4o mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "replicate/replicate-internal/llama-405b-instruct-vllm", + "name": "llama 405u instruct vllm", + "display_name": "llama 405u instruct vllm", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-08-27", + "last_updated": "2024-08-27", + "cost": { + "input": 9.5, + "output": 9.5 + } + }, + { + "id": "replicate/meta/meta-llama-3.1-405b-instruct", + "name": "meta llama 3.1 405u instruct", + "display_name": "meta llama 3.1 405u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 9.5, + "output": 9.5 + } + }, + { + "id": "replicate/meta/meta-llama-3-70b-instruct", + "name": "meta llama 3 70u instruct", + "display_name": "meta llama 3 70u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-10-08", + "last_updated": "2024-10-08", + "cost": { + "input": 0, + "output": 2.75 + } + }, + { + "id": "replicate/meta/meta-llama-3-8b-instruct", + "name": "meta llama 3 8u instruct", + "display_name": "meta llama 3 8u instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "replicate/deepseek-ai/deepseek-r1", + "name": "deepseek r1", + "display_name": "deepseek r1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "cost": { + "input": 10, + "output": 10 + } + }, + { + "id": "anthropic/claude-opus-4", + "name": "claude opus 4", + "display_name": "claude opus 4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75 + } + }, + { + "id": "anthropic/claude-opus-4-1", + "name": "claude opus 4 1", + "display_name": "claude opus 4 1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 15, + "output": 75 + } + }, + { + "id": "anthropic/claude-haiku-4-5", + "name": "claude haiku 4 5", + "display_name": "claude haiku 4 5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1, + "output": 5 + } + }, + { + "id": "anthropic/claude-haiku-4.5", + "name": "claude haiku 4.5", + "display_name": "claude haiku 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1, + "output": 5 + } + }, + { + "id": "anthropic/claude-3-haiku", + "name": "claude 3 haiku", + "display_name": "claude 3 haiku", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-31", + "last_updated": "2024-07-31", + "cost": { + "input": 0, + "output": 1.25 + } + }, + { + "id": "anthropic/claude-opus-4-5", + "name": "claude opus 4 5", + "display_name": "claude opus 4 5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5, + "output": 25 + } + }, + { + "id": "anthropic/claude-3-opus", + "name": "claude 3 opus", + "display_name": "claude 3 opus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-31", + "last_updated": "2024-07-31", + "cost": { + "input": 15, + "output": 75 + } + }, + { + "id": "anthropic/claude-sonnet-4-5", + "name": "claude sonnet 4 5", + "display_name": "claude sonnet 4 5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 3, + "output": 15 + } + }, + { + "id": "anthropic/claude-3.5-sonnet", + "name": "claude 3.5 sonnet", + "display_name": "claude 3.5 sonnet", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-31", + "last_updated": "2024-07-31", + "cost": { + "input": 3, + "output": 15 + } + }, + { + "id": "anthropic/claude-3-sonnet", + "name": "claude 3 sonnet", + "display_name": "claude 3 sonnet", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-31", + "last_updated": "2024-07-31", + "cost": { + "input": 3, + "output": 15 + } + }, + { + "id": "anthropic/claude-3-5-haiku", + "name": "claude 3 5 haiku", + "display_name": "claude 3 5 haiku", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-11-04", + "last_updated": "2024-11-04", + "cost": { + "input": 0, + "output": 4 + } + }, + { + "id": "anthropic/claude-opus-4.1", + "name": "claude opus 4.1", + "display_name": "claude opus 4.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75 + } + }, + { + "id": "anthropic/claude-3.5-haiku", + "name": "claude 3.5 haiku", + "display_name": "claude 3.5 haiku", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-01-07", + "last_updated": "2025-01-07", + "cost": { + "input": 0, + "output": 4 + } + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "claude sonnet 4", + "display_name": "claude sonnet 4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15 + } + }, + { + "id": "anthropic/claude-opus-4.5", + "name": "claude opus 4.5", + "display_name": "claude opus 4.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5, + "output": 25 + } + }, + { + "id": "anthropic/claude-sonnet-4.5", + "name": "claude sonnet 4.5", + "display_name": "claude sonnet 4.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-08", + "last_updated": "2025-10-08", + "cost": { + "input": 3, + "output": 15 + } + } + ] + }, + "openai": { + "id": "openai", + "name": "OpenAI", + "display_name": "OpenAI", + "doc": "https://platform.openai.com/docs/models", + "models": [ + { + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + } + }, + { + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8191, + "output": 1536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.02, + "output": 0 + } + }, + { + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 30, + "output": 60 + } + }, + { + "id": "o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", + "cost": { + "input": 150, + "output": 600 + } + }, + { + "id": "gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "cost": { + "input": 5, + "output": 15 + } + }, + { + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } + }, + { + "id": "gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } + }, + { + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + } + }, + { + "id": "o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", + "cost": { + "input": 10, + "output": 40, + "cache_read": 2.5 + } + }, + { + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16385, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + } + }, + { + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 21, + "output": 168 + } + }, + { + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8191, + "output": 3072 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.13, + "output": 0 + } + }, + { + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + } + }, + { + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + } + }, + { + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } + }, + { + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } + }, + { + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } + }, + { + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } + }, + { + "id": "codex-mini-latest", + "name": "Codex Mini", + "display_name": "Codex Mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", + "cost": { + "input": 1.5, + "output": 6, + "cache_read": 0.375 + } + }, + { + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + } + }, + { + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } + }, + { + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } + }, + { + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + } + }, + { + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } + }, + { + "id": "o1", + "name": "o1", + "display_name": "o1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + } + }, + { + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.03 + } + }, + { + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 65536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } + }, + { + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 1536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2022-12", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", + "cost": { + "input": 0.1, + "output": 0 + } + }, + { + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", + "cost": { + "input": 20, + "output": 80 + } + }, + { + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } + }, + { + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } + }, + { + "id": "o3", + "name": "o3", + "display_name": "o3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + } + }, + { + "id": "o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "stable-diffusion-xl-lightning", - "name": "@cf/bytedance/stable-diffusion-xl-lightning", - "display_name": "@cf/bytedance/stable-diffusion-xl-lightning", + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 400000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-02-20", - "last_updated": "2024-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10 } }, { - "id": "mistral-7b-instruct-v0.1", - "name": "@cf/mistral/mistral-7b-instruct-v0.1", - "display_name": "@cf/mistral/mistral-7b-instruct-v0.1", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2824, - "output": 2824 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-09-27", - "last_updated": "2025-07-24", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.11, - "output": 0.19 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 } }, { - "id": "llava-1.5-7b-hf", - "name": "@cf/llava-hf/llava-1.5-7b-hf", - "display_name": "@cf/llava-hf/llava-1.5-7b-hf", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2023-12-05", - "last_updated": "2025-06-06", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } }, { - "id": "gpt-oss-20b", - "name": "@cf/openai/gpt-oss-20b", - "display_name": "@cf/openai/gpt-oss-20b", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 400000, + "output": 272000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.2, - "output": 0.3 + "input": 15, + "output": 120 } }, { - "id": "deepseek-math-7b-instruct", - "name": "@cf/deepseek-ai/deepseek-math-7b-instruct", - "display_name": "@cf/deepseek-ai/deepseek-math-7b-instruct", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-02-05", - "last_updated": "2024-02-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 } }, { - "id": "gpt-oss-120b", - "name": "@cf/openai/gpt-oss-120b", - "display_name": "@cf/openai/gpt-oss-120b", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -26440,56 +33736,72 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.35, - "output": 0.75 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } - }, + } + ] + }, + "zhipuai-coding-plan": { + "id": "zhipuai-coding-plan", + "name": "Zhipu AI Coding Plan", + "display_name": "Zhipu AI Coding Plan", + "api": "https://open.bigmodel.cn/api/coding/paas/v4", + "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", + "models": [ { - "id": "melotts", - "name": "@cf/myshell-ai/melotts", - "display_name": "@cf/myshell-ai/melotts", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 128000, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2024-07-19", - "last_updated": "2024-07-19", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.0002, + "input": 0, "output": 0 } }, { - "id": "qwen1.5-7b-chat-awq", - "name": "@cf/qwen/qwen1.5-7b-chat-awq", - "display_name": "@cf/qwen/qwen1.5-7b-chat-awq", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -26499,87 +33811,99 @@ ] }, "limit": { - "context": 20000, - "output": 20000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-02-03", - "last_updated": "2024-04-30", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 } }, { - "id": "llama-3.1-8b-instruct-fast", - "name": "@cf/meta/llama-3.1-8b-instruct-fast", - "display_name": "@cf/meta/llama-3.1-8b-instruct-fast", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-09-25", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.045, - "output": 0.384 + "input": 0, + "output": 0 } }, { - "id": "nova-3", - "name": "@cf/deepgram/nova-3", - "display_name": "@cf/deepgram/nova-3", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 131072, + "output": 98304 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-06-05", - "last_updated": "2025-07-08", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.0052, - "output": 0.0052 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 } }, { - "id": "llama-3.1-70b-instruct", - "name": "@cf/meta/llama-3.1-70b-instruct", - "display_name": "@cf/meta/llama-3.1-70b-instruct", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -26589,27 +33913,31 @@ ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-12-15", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.293, - "output": 2.253 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 } }, { - "id": "qwq-32b", - "name": "@cf/qwen/qwq-32b", - "display_name": "@cf/qwen/qwq-32b", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -26619,27 +33947,39 @@ ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-11", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.66, - "output": 1 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 } - }, + } + ] + }, + "perplexity": { + "id": "perplexity", + "name": "Perplexity", + "display_name": "Perplexity", + "doc": "https://docs.perplexity.ai", + "models": [ { - "id": "zephyr-7b-beta-awq", - "name": "@hf/thebloke/zephyr-7b-beta-awq", - "display_name": "@hf/thebloke/zephyr-7b-beta-awq", + "id": "sonar-reasoning", + "name": "Sonar Reasoning", + "display_name": "Sonar Reasoning", "modalities": { "input": [ "text" @@ -26649,27 +33989,29 @@ ] }, "limit": { - "context": 4096, + "context": 128000, "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2023-10-27", - "last_updated": "2023-11-09", + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5 } }, { - "id": "deepseek-coder-6.7b-instruct-awq", - "name": "@hf/thebloke/deepseek-coder-6.7b-instruct-awq", - "display_name": "@hf/thebloke/deepseek-coder-6.7b-instruct-awq", + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ "text" @@ -26679,90 +34021,104 @@ ] }, "limit": { - "context": 4096, + "context": 128000, "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-05", - "last_updated": "2023-11-13", + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 1 } }, { - "id": "llama-3.1-8b-instruct-awq", - "name": "@cf/meta/llama-3.1-8b-instruct-awq", - "display_name": "@cf/meta/llama-3.1-8b-instruct-awq", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, + "context": 200000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2024-07-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.12, - "output": 0.27 + "input": 3, + "output": 15 } }, { - "id": "mistral-7b-instruct-v0.2-lora", - "name": "@cf/mistral/mistral-7b-instruct-v0.2-lora", - "display_name": "@cf/mistral/mistral-7b-instruct-v0.2-lora", + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 15000, - "output": 15000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-01", - "last_updated": "2024-04-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8 } - }, + } + ] + }, + "zenmux": { + "id": "zenmux", + "name": "zenmux", + "display_name": "zenmux", + "api": "https://zenmux.ai/api/v1", + "doc": "https://docs.zenmux.ai", + "models": [ { - "id": "uform-gen2-qwen-500m", - "name": "@cf/unum/uform-gen2-qwen-500m", - "display_name": "@cf/unum/uform-gen2-qwen-500m", + "id": "moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -26770,36 +34126,29 @@ ] }, "limit": { - "context": 0, - "output": 0 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-15", - "last_updated": "2024-04-24", + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0, - "output": 0 + "input": 1.15, + "output": 8 } - } - ] - }, - "inception": { - "id": "inception", - "name": "Inception", - "display_name": "Inception", - "api": "https://api.inceptionlabs.ai/v1/", - "doc": "https://platform.inceptionlabs.ai/docs", - "models": [ + }, { - "id": "mercury-coder", - "name": "Mercury Coder", - "display_name": "Mercury Coder", + "id": "moonshotai/kimi-k2-0905", + "name": "MoonshotAI: Kimi K2 0905", + "display_name": "MoonshotAI: Kimi K2 0905", "modalities": { "input": [ "text" @@ -26809,8 +34158,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -26819,20 +34168,20 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-02-26", - "last_updated": "2025-07-31", + "knowledge": "2024-10", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 0.25, - "output": 1, - "cache_read": 0.25, - "cache_write": 1 - } + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, + "type": "chat" }, { - "id": "mercury", - "name": "Mercury", - "display_name": "Mercury", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -26842,38 +34191,29 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-06-26", - "last_updated": "2025-07-31", + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.25, - "output": 1, - "cache_read": 0.25, - "cache_write": 1 + "input": 0.6, + "output": 2.5 } - } - ] - }, - "openai": { - "id": "openai", - "name": "OpenAI", - "display_name": "OpenAI", - "doc": "https://platform.openai.com/docs/models", - "models": [ + }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "x-ai/grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ "text", @@ -26884,8 +34224,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -26894,19 +34234,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 } }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "x-ai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" @@ -26916,28 +34256,31 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 256000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.02, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.75, + "reasoning": 15 } }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "x-ai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -26947,28 +34290,30 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 30, - "output": 60 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 } }, { - "id": "o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "x-ai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text", @@ -26979,10 +34324,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26990,118 +34335,121 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 150, - "output": 600 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 } }, { - "id": "gpt-4o-2024-05-13", - "name": "GPT-4o (2024-05-13)", - "display_name": "GPT-4o (2024-05-13)", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek: DeepSeek V3", + "display_name": "DeepSeek: DeepSeek V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 5, - "output": 15 - } + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 + }, + "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "minimax/minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, + "context": 204800, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.3, + "output": 1.2 } }, { - "id": "gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "display_name": "Google: Gemini 2.5 Pro", "modalities": { "input": [ + "image", "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 2.5, + "input": 1.25, "output": 10, - "cache_read": 1.25 - } + "cache_read": 0.31, + "cache_write": 4.5 + }, + "type": "imageGeneration" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ "text", @@ -27112,29 +34460,30 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-10-01", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "openai/gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", @@ -27145,8 +34494,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 272000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -27156,19 +34505,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 - } + "input": 1.25, + "output": 10, + "cache_read": 0.13 + }, + "type": "chat" }, { - "id": "gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "inclusionai/ring-1t", + "name": "inclusionAI: Ring 1T", + "display_name": "inclusionAI: Ring 1T", "modalities": { "input": [ "text" @@ -27178,64 +34528,34 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2025-10-12", + "last_updated": "2025-10-12", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 - } - }, - { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8191, - "output": 3072 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "input": 0.56, + "output": 2.24, + "cache_read": 0.112 }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.13, - "output": 0 - } + "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "inclusionai/lint-1t", + "name": "Ling-1T", + "display_name": "Ling-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -27243,27 +34563,29 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 10, - "output": 30 + "input": 0.56, + "output": 2.24, + "cache_read": 0.112 } }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "z-ai/glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -27273,65 +34595,65 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "z-ai/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "qwen/qwen3-coder-plus", + "name": "Qwen: Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen: Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -27341,67 +34663,68 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 4096, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "kuaishou/kat-coder-pro-v1", + "name": "KAT-Coder-Pro-V1", + "display_name": "KAT-Coder-Pro-V1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01-01", + "release_date": "2025-10-23", + "last_updated": "2025-10-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.6, + "output": 2.4, + "cache_read": 0.12 } }, { - "id": "codex-mini-latest", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -27409,9 +34732,9 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27419,19 +34742,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", @@ -27442,10 +34766,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27453,19 +34777,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -27476,30 +34801,31 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", @@ -27510,8 +34836,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -27520,19 +34846,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 } }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", @@ -27543,8 +34870,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -27553,19 +34880,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ "text", @@ -27577,9 +34905,9 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27587,19 +34915,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -27611,9 +34940,9 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27621,19 +34950,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { "input": 15, - "output": 60, - "cache_read": 7.5 + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", @@ -27644,10 +34974,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27655,19 +34985,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "deepseek/deepseek-chat-v3.1", + "name": "DeepSeek: DeepSeek V3.1", + "display_name": "DeepSeek: DeepSeek V3.1", "modalities": { "input": [ "text" @@ -27677,30 +35008,20 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", - "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - } + "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek: R1 0528", + "display_name": "DeepSeek: R1 0528", "modalities": { "input": [ "text" @@ -27710,295 +35031,289 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 163840, + "output": 163840 }, - "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2022-12", - "release_date": "2022-12-15", - "last_updated": "2022-12-15", - "cost": { - "input": 0.1, - "output": 0 - } + "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "google/gemini-2.0-flash", + "name": "Google: Gemini 2.0 Flash", + "display_name": "Google: Gemini 2.0 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", - "cost": { - "input": 20, - "output": 80 - } + "type": "imageGeneration" }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "google/gemini-2.0-flash-lite-001", + "name": "Google: Gemini 2.0 Flash Lite", + "display_name": "Google: Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - } + "type": "imageGeneration" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "display_name": "Google: Gemini 2.5 Flash", "modalities": { "input": [ + "image", "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65535 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - } + "type": "imageGeneration" }, { - "id": "o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ + "image", "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65535 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - } + "type": "imageGeneration" }, { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "inclusionai/ling-1t", + "name": "inclusionAI: Ling-1T", + "display_name": "inclusionAI: Ling-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10 - } + "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "inclusionai/ling-flash-2.0", + "name": "inclusionAI: Ling Flash 2.0", + "display_name": "inclusionAI: Ling Flash 2.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - } + "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "inclusionai/ling-mini-2.0", + "name": "inclusionAI: Ling Mini 2.0", + "display_name": "inclusionAI: Ling Mini 2.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "inclusionai/ring-flash-2.0", + "name": "inclusionAI: Ring Flash 2.0", + "display_name": "inclusionAI: Ring Flash 2.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - } + "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "inclusionai/ring-mini-2.0", + "name": "inclusionAI: Ring Mini 2.0", + "display_name": "inclusionAI: Ring Mini 2.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 131072, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "type": "chat" + }, + { + "id": "moonshotai/kimi-k2-0711", + "name": "kimi-k2-0711", + "display_name": "kimi-k2-0711", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 15, - "output": 120 + "input": 2, + "output": 8, + "cache_read": 0.5 } - }, - { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + }, + { + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", @@ -28009,249 +35324,242 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 } - } - ] - }, - "zhipuai-coding-plan": { - "id": "zhipuai-coding-plan", - "name": "Zhipu AI Coding Plan", - "display_name": "Zhipu AI Coding Plan", - "api": "https://open.bigmodel.cn/api/coding/paas/v4", - "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", - "models": [ + }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 } }, { - "id": "glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, + "context": 128000, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 10, + "cache_read": 1.25 } }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 } }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "openai/gpt-5-chat", + "name": "gpt-5-chat", + "display_name": "gpt-5-chat", + "limit": { + "context": 272000, + "output": 16384 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - } + "input": 0.25, + "output": 2, + "cache_read": 0.03 + }, + "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "openai/gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - } - } - ] - }, - "perplexity": { - "id": "perplexity", - "name": "Perplexity", - "display_name": "Perplexity", - "doc": "https://docs.perplexity.ai", - "models": [ + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + }, + "type": "chat" + }, { - "id": "sonar-reasoning", - "name": "Sonar Reasoning", - "display_name": "Sonar Reasoning", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1, - "output": 5 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 } }, { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "qwen/qwen3-235b-a22b-2507", + "name": "Qwen: Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -28261,102 +35569,66 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", - "cost": { - "input": 1, - "output": 1 - } + "type": "chat" }, { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262144, + "output": 262144 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", - "cost": { - "input": 3, - "output": 15 - } + "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "display_name": "Qwen: Qwen3 Coder 480B A35B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", - "cost": { - "input": 2, - "output": 8 - } - } - ] - }, - "zenmux": { - "id": "zenmux", - "name": "zenmux", - "display_name": "zenmux", - "api": "https://zenmux.ai/api/v1", - "doc": "https://docs.zenmux.ai", - "models": [ + "type": "chat" + }, { - "id": "moonshotai/kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "qwen/qwen3-max", + "name": "Qwen: Qwen3 Max", + "display_name": "Qwen: Qwen3 Max", "modalities": { "input": [ "text" @@ -28366,32 +35638,23 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", - "cost": { - "input": 1.15, - "output": 8 - } + "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "MoonshotAI: Kimi K2 0905", - "display_name": "MoonshotAI: Kimi K2 0905", + "id": "qwen/qwen3-vl-plus", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -28404,24 +35667,15 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", - "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "z-ai/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -28431,8 +35685,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -28441,52 +35695,60 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0.6, - "output": 2.5 + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 } - }, + } + ] + }, + "ovhcloud": { + "id": "ovhcloud", + "name": "OVHcloud AI Endpoints", + "display_name": "OVHcloud AI Endpoints", + "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", + "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "models": [ { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "mixtral-8x7b-instruct-v0.1", + "name": "Mixtral-8x7B-Instruct-v0.1", + "display_name": "Mixtral-8x7B-Instruct-v0.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.7, + "output": 0.7 } }, { - "id": "x-ai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ "text" @@ -28496,31 +35758,27 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 127000, + "output": 127000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "reasoning": 15 + "input": 0.11, + "output": 0.11 } }, { - "id": "x-ai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "llama-3.1-8b-instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -28530,30 +35788,27 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": true, + "release_date": "2025-06-11", + "last_updated": "2025-06-11", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.11, + "output": 0.11 } }, { - "id": "x-ai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -28563,31 +35818,28 @@ "text" ] }, - "limit": { - "context": 2000000, - "output": 30000 + "limit": { + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "release_date": "2025-03-31", + "last_updated": "2025-03-31", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 1.01, + "output": 1.01 } }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek: DeepSeek V3", - "display_name": "DeepSeek: DeepSeek V3", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral-Nemo-Instruct-2407", + "display_name": "Mistral-Nemo-Instruct-2407", "modalities": { "input": [ "text" @@ -28597,8 +35849,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 118000, + "output": 118000 }, "temperature": true, "tool_call": true, @@ -28607,123 +35859,108 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 - }, - "type": "chat" + "input": 0.14, + "output": 0.14 + } }, { - "id": "minimax/minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral-Small-3.2-24B-Instruct-2506", + "display_name": "Mistral-Small-3.2-24B-Instruct-2506", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, + "context": 128000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.1, + "output": 0.31 } }, { - "id": "google/gemini-2.5-pro", - "name": "Google: Gemini 2.5 Pro", - "display_name": "Google: Gemini 2.5 Pro", + "id": "qwen2.5-coder-32b-instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ - "image", - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31, - "cache_write": 4.5 - }, - "type": "imageGeneration" + "input": 0.96, + "output": 0.96 + } }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.07, + "output": 0.26 } }, { - "id": "openai/gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "llava-next-mistral-7b", + "name": "llava-next-mistral-7b", + "display_name": "llava-next-mistral-7b", "modalities": { "input": [ "text", @@ -28734,31 +35971,27 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 32000, + "output": 32000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-01-08", + "last_updated": "2025-01-08", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 0.32, + "output": 0.32 + } }, { - "id": "inclusionai/ring-1t", - "name": "inclusionAI: Ring 1T", - "display_name": "inclusionAI: Ring 1T", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek-R1-Distill-Llama-70B", + "display_name": "DeepSeek-R1-Distill-Llama-70B", "modalities": { "input": [ "text" @@ -28768,8 +36001,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -28779,20 +36012,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-10-12", - "last_updated": "2025-10-12", + "release_date": "2025-01-30", + "last_updated": "2025-01-30", "cost": { - "input": 0.56, - "output": 2.24, - "cache_read": 0.112 - }, - "type": "chat" + "input": 0.74, + "output": 0.74 + } }, { - "id": "inclusionai/lint-1t", - "name": "Ling-1T", - "display_name": "Ling-1T", + "id": "meta-llama-3_1-70b-instruct", + "name": "Meta-Llama-3_1-70B-Instruct", + "display_name": "Meta-Llama-3_1-70B-Instruct", "modalities": { "input": [ "text" @@ -28802,30 +36032,27 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-10-09", - "last_updated": "2025-10-09", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.56, - "output": 2.24, - "cache_read": 0.112 + "input": 0.74, + "output": 0.74 } }, { - "id": "z-ai/glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -28835,10 +36062,9 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 131000, + "output": 131000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28846,20 +36072,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.05, + "output": 0.18 } }, { - "id": "z-ai/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -28869,10 +36092,9 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131000, + "output": 131000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28880,20 +36102,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.09, + "output": 0.47 } }, { - "id": "qwen/qwen3-coder-plus", - "name": "Qwen: Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen: Qwen3 Coder 480B A35B Instruct", + "id": "meta-llama-3_3-70b-instruct", + "name": "Meta-Llama-3_3-70B-Instruct", + "display_name": "Meta-Llama-3_3-70B-Instruct", "modalities": { "input": [ "text" @@ -28903,30 +36122,27 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.74, + "output": 0.74 } }, { - "id": "kuaishou/kat-coder-pro-v1", - "name": "KAT-Coder-Pro-V1", - "display_name": "KAT-Coder-Pro-V1", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -28936,7 +36152,7 @@ ] }, "limit": { - "context": 256000, + "context": 32000, "output": 32000 }, "temperature": true, @@ -28946,20 +36162,26 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-10-23", - "last_updated": "2025-10-23", + "open_weights": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.12 + "input": 0.09, + "output": 0.25 } - }, + } + ] + }, + "v0": { + "id": "v0", + "name": "v0", + "display_name": "v0", + "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", + "models": [ { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "v0-1.5-lg", + "name": "v0-1.5-lg", + "display_name": "v0-1.5-lg", "modalities": { "input": [ "text", @@ -28970,8 +36192,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 512000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -28981,20 +36203,17 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 15, + "output": 75 } }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ "text", @@ -29005,7 +36224,7 @@ ] }, "limit": { - "context": 200000, + "context": 128000, "output": 32000 }, "temperature": true, @@ -29016,20 +36235,17 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3, + "output": 15 } }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ "text", @@ -29040,8 +36256,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -29051,170 +36267,130 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "output": 15 } - }, + } + ] + }, + "iflowcn": { + "id": "iflowcn", + "name": "iFlow", + "display_name": "iFlow", + "api": "https://apis.iflow.cn/v1", + "doc": "https://platform.iflow.cn/en/docs", + "models": [ { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "qwen3-coder", + "name": "Qwen3-Coder-480B-A35B", + "display_name": "Qwen3-Coder-480B-A35B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0, + "output": 0 } }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 } }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "kimi-k2", + "name": "Kimi-K2", + "display_name": "Kimi-K2", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 200000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - } - }, - { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0, + "output": 0 } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { - "input": [ - "text", - "image" + "input": [ + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -29222,22 +36398,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 } }, { - "id": "deepseek/deepseek-chat-v3.1", - "name": "DeepSeek: DeepSeek V3.1", - "display_name": "DeepSeek: DeepSeek V3.1", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1-Terminus", + "display_name": "DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -29247,20 +36421,29 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek: R1 0528", - "display_name": "DeepSeek: R1 0528", + "id": "minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -29270,122 +36453,157 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 204800, + "output": 131100 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "google/gemini-2.0-flash", - "name": "Google: Gemini 2.0 Flash", - "display_name": "Google: Gemini 2.0 Flash", + "id": "qwen3-235b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 128000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "type": "imageGeneration" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "google/gemini-2.0-flash-lite-001", - "name": "Google: Gemini 2.0 Flash Lite", - "display_name": "Google: Gemini 2.0 Flash Lite", + "id": "deepseek-v3.2-chat", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 128000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "type": "imageGeneration" + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "google/gemini-2.5-flash", - "name": "Google: Gemini 2.5 Flash", - "display_name": "Google: Gemini 2.5 Flash", + "id": "kimi-k2-0905", + "name": "Kimi-K2-0905", + "display_name": "Kimi-K2-0905", "modalities": { "input": [ - "image", - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 256000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Google: Gemini 2.5 Flash Lite", - "display_name": "Google: Gemini 2.5 Flash Lite", + "id": "kimi-k2-thinking", + "name": "Kimi-K2-Thinking", + "display_name": "Kimi-K2-Thinking", "modalities": { "input": [ - "image", - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "type": "imageGeneration" + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "inclusionai/ling-1t", - "name": "inclusionAI: Ling-1T", - "display_name": "inclusionAI: Ling-1T", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3-235B-A22B-Thinking", + "display_name": "Qwen3-235B-A22B-Thinking", "modalities": { "input": [ "text" @@ -29395,41 +36613,61 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "inclusionai/ling-flash-2.0", - "name": "inclusionAI: Ling Flash 2.0", - "display_name": "inclusionAI: Ling Flash 2.0", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL-Plus", + "display_name": "Qwen3-VL-Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "inclusionai/ling-mini-2.0", - "name": "inclusionAI: Ling Mini 2.0", - "display_name": "inclusionAI: Ling Mini 2.0", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -29439,19 +36677,29 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-11-13", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "inclusionai/ring-flash-2.0", - "name": "inclusionAI: Ring Flash 2.0", - "display_name": "inclusionAI: Ring Flash 2.0", + "id": "tstars2.0", + "name": "TStars-2.0", + "display_name": "TStars-2.0", "modalities": { "input": [ "text" @@ -29461,20 +36709,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "inclusionai/ring-mini-2.0", - "name": "inclusionAI: Ring Mini 2.0", - "display_name": "inclusionAI: Ring Mini 2.0", + "id": "qwen3-235b-a22b-instruct", + "name": "Qwen3-235B-A22B-Instruct", + "display_name": "Qwen3-235B-A22B-Instruct", "modalities": { "input": [ "text" @@ -29484,20 +36740,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "moonshotai/kimi-k2-0711", - "name": "kimi-k2-0711", - "display_name": "kimi-k2-0711", + "id": "qwen3-max", + "name": "Qwen3-Max", + "display_name": "Qwen3-Max", "modalities": { "input": [ "text" @@ -29507,122 +36771,124 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 256000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2-Exp", + "display_name": "DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0 } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "qwen3-max-preview", + "name": "Qwen3-Max-Preview", + "display_name": "Qwen3-Max-Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0, + "output": 0 } }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "qwen3-coder-plus", + "name": "Qwen3-Coder-Plus", + "display_name": "Qwen3-Coder-Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 0, + "output": 0 } }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -29630,32 +36896,39 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0, + "output": 0 } - }, + } + ] + }, + "synthetic": { + "id": "synthetic", + "name": "Synthetic", + "display_name": "Synthetic", + "api": "https://api.synthetic.new/v1", + "doc": "https://synthetic.new/pricing", + "models": [ { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "hf:openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -29663,142 +36936,140 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.1, + "output": 0.1 } - }, - { - "id": "openai/gpt-5-chat", - "name": "gpt-5-chat", - "display_name": "gpt-5-chat", - "limit": { - "context": 272000, - "output": 16384 - }, - "type": "chat" - }, + } + ] + }, + "deepinfra": { + "id": "deepinfra", + "name": "Deep Infra", + "display_name": "Deep Infra", + "doc": "https://deepinfra.com/models", + "models": [ { - "id": "openai/gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 - }, - "type": "chat" + "input": 0.03, + "output": 0.14 + } }, { - "id": "openai/gpt-5-nano", - "name": "gpt-5-nano", - "display_name": "gpt-5-nano", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { "input": 0.05, - "output": 0.4, - "cache_read": 0.01 - }, - "type": "chat" - }, + "output": 0.24 + } + } + ] + }, + "zhipuai": { + "id": "zhipuai", + "name": "Zhipu AI", + "display_name": "Zhipu AI", + "api": "https://open.bigmodel.cn/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.3, + "output": 0.9 } }, { - "id": "qwen/qwen3-235b-a22b-2507", - "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -29808,43 +37079,65 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 64000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "cost": { + "input": 0.6, + "output": 1.8 + } }, { - "id": "qwen/qwen3-coder", - "name": "Qwen: Qwen3 Coder 480B A35B", - "display_name": "Qwen: Qwen3 Coder 480B A35B", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -29854,20 +37147,31 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 98304 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 + } }, { - "id": "qwen/qwen3-max", - "name": "Qwen: Qwen3 Max", - "display_name": "Qwen: Qwen3 Max", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -29877,31 +37181,42 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 98304 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "qwen/qwen3-vl-plus", - "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -29909,12 +37224,31 @@ "supported": true, "default": true }, - "type": "imageGeneration" - }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } + } + ] + }, + "submodel": { + "id": "submodel", + "name": "submodel", + "display_name": "submodel", + "api": "https://llm.submodel.ai/v1", + "doc": "https://submodel.gitbook.io", + "models": [ { - "id": "z-ai/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -29925,7 +37259,7 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -29935,29 +37269,26 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.1, + "output": 0.5 } } ] }, - "ovhcloud": { - "id": "ovhcloud", - "name": "OVHcloud AI Endpoints", - "display_name": "OVHcloud AI Endpoints", - "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", - "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "zai": { + "id": "zai", + "name": "Z.AI", + "display_name": "Z.AI", + "api": "https://api.z.ai/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", "models": [ { - "id": "mixtral-8x7b-instruct-v0.1", - "name": "Mixtral-8x7B-Instruct-v0.1", - "display_name": "Mixtral-8x7B-Instruct-v0.1", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -29967,27 +37298,31 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 } }, { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -29997,27 +37332,31 @@ ] }, "limit": { - "context": 127000, - "output": 127000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 } }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -30027,58 +37366,65 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-11", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 } }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 64000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 1.01, - "output": 1.01 + "input": 0.6, + "output": 1.8 } }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral-Nemo-Instruct-2407", - "display_name": "Mistral-Nemo-Instruct-2407", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -30088,31 +37434,36 @@ ] }, "limit": { - "context": 118000, - "output": 118000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.14, - "output": 0.14 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 } }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral-Small-3.2-24B-Instruct-2506", - "display_name": "Mistral-Small-3.2-24B-Instruct-2506", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -30120,26 +37471,37 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.1, - "output": 0.31 + "input": 0.3, + "output": 0.9 } - }, + } + ] + }, + "inference": { + "id": "inference", + "name": "Inference", + "display_name": "Inference", + "api": "https://inference.net/v1", + "doc": "https://inference.net/models", + "models": [ { - "id": "qwen2.5-coder-32b-instruct", - "name": "Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen2.5-Coder-32B-Instruct", + "id": "mistral/mistral-nemo-12b-instruct", + "name": "Mistral Nemo 12B Instruct", + "display_name": "Mistral Nemo 12B Instruct", "modalities": { "input": [ "text" @@ -30149,88 +37511,91 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 16000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.96, - "output": 0.96 + "input": 0.038, + "output": 0.1 } }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen3-Coder-30B-A3B-Instruct", + "id": "google/gemma-3", + "name": "Google Gemma 3", + "display_name": "Google Gemma 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 125000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.07, - "output": 0.26 + "input": 0.15, + "output": 0.3 } }, { - "id": "llava-next-mistral-7b", - "name": "llava-next-mistral-7b", - "display_name": "llava-next-mistral-7b", + "id": "osmosis/osmosis-structure-0.6b", + "name": "Osmosis Structure 0.6B", + "display_name": "Osmosis Structure 0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 4000, + "output": 2048 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-01-08", - "last_updated": "2025-01-08", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.32, - "output": 0.32 + "input": 0.1, + "output": 0.5 } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek-R1-Distill-Llama-70B", - "display_name": "DeepSeek-R1-Distill-Llama-70B", + "id": "qwen/qwen3-embedding-4b", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", "modalities": { "input": [ "text" @@ -30240,88 +37605,92 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 32000, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-01-30", - "last_updated": "2025-01-30", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.74, - "output": 0.74 + "input": 0.01, + "output": 0 } }, { - "id": "meta-llama-3_1-70b-instruct", - "name": "Meta-Llama-3_1-70B-Instruct", - "display_name": "Meta-Llama-3_1-70B-Instruct", + "id": "qwen/qwen-2.5-7b-vision-instruct", + "name": "Qwen 2.5 7B Vision Instruct", + "display_name": "Qwen 2.5 7B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 125000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.74, - "output": 0.74 + "input": 0.2, + "output": 0.2 } }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 16000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.05, - "output": 0.18 + "input": 0.055, + "output": 0.055 } }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -30331,27 +37700,28 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 16000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.09, - "output": 0.47 + "input": 0.025, + "output": 0.025 } }, { - "id": "meta-llama-3_3-70b-instruct", - "name": "Meta-Llama-3_3-70B-Instruct", - "display_name": "Meta-Llama-3_3-70B-Instruct", + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -30361,8 +37731,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -30371,17 +37741,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.74, - "output": 0.74 + "input": 0.02, + "output": 0.02 } }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -30391,36 +37762,37 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.09, - "output": 0.25 + "input": 0.01, + "output": 0.01 } } ] }, - "v0": { - "id": "v0", - "name": "v0", - "display_name": "v0", - "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", + "requesty": { + "id": "requesty", + "name": "Requesty", + "display_name": "Requesty", + "api": "https://router.requesty.ai/v1", + "doc": "https://requesty.ai/solution/llm-routing/models", "models": [ { - "id": "v0-1.5-lg", - "name": "v0-1.5-lg", - "display_name": "v0-1.5-lg", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text", @@ -30431,8 +37803,8 @@ ] }, "limit": { - "context": 512000, - "output": 32000 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -30442,29 +37814,31 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "knowledge": "2025-01", + "release_date": "2025-09-09", + "last_updated": "2025-09-09", "cost": { - "input": 15, - "output": 75 + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 3 } }, { - "id": "v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "xai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 2000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -30474,29 +37848,35 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "knowledge": "2025-01", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 3, - "output": 15 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.2 } }, { - "id": "v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -30506,119 +37886,129 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 3, - "output": 15 + "input": 2, + "output": 12, + "cache_read": 0.2, + "cache_write": 4.5 } - } - ] - }, - "iflowcn": { - "id": "iflowcn", - "name": "iFlow", - "display_name": "iFlow", - "api": "https://apis.iflow.cn/v1", - "doc": "https://platform.iflow.cn/en/docs", - "models": [ + }, { - "id": "qwen3-coder", - "name": "Qwen3-Coder-480B-A35B", - "display_name": "Qwen3-Coder-480B-A35B", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.55 } }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3-671B", - "display_name": "DeepSeek-V3-671B", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.31, + "cache_write": 2.375 } }, { - "id": "kimi-k2", - "name": "Kimi-K2", - "display_name": "Kimi-K2", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 } }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text" @@ -30628,72 +38018,75 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 16000, + "output": 4000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 } }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1-Terminus", - "display_name": "DeepSeek-V3.1-Terminus", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "openai/o4-mini", + "name": "o4 Mini", + "display_name": "o4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 200000, + "output": 100000 }, "temperature": true, "tool_call": true, @@ -30701,24 +38094,25 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 } }, { - "id": "qwen3-235b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -30728,124 +38122,139 @@ "context": 128000, "output": 32000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.03 } }, { - "id": "kimi-k2-0905", - "name": "Kimi-K2-Instruct-0905", - "display_name": "Kimi-K2-Instruct-0905", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 } }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3-235B-A22B-Thinking", - "display_name": "Qwen3-235B-A22B-Thinking", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "audio", + "image", + "video" ], "output": [ - "text" + "text", + "audio", + "image" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL-Plus", - "display_name": "Qwen3-VL-Plus", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 200000, "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -30853,7 +38262,7 @@ }, "limit": { "context": 200000, - "output": 128000 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -30861,175 +38270,211 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2025-11-13", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "tstars2.0", - "name": "TStars-2.0", - "display_name": "TStars-2.0", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 200000, + "output": 62000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-02-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "qwen3-235b-a22b-instruct", - "name": "Qwen3-235B-A22B-Instruct", - "display_name": "Qwen3-235B-A22B-Instruct", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 200000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 } }, { - "id": "qwen3-max", - "name": "Qwen3-Max", - "display_name": "Qwen3-Max", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2-Exp", - "display_name": "DeepSeek-V3.2-Exp", + "id": "anthropic/claude-3-7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "qwen3-max-preview", - "name": "Qwen3-Max-Preview", - "display_name": "Qwen3-Max-Preview", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } - }, + } + ] + }, + "morph": { + "id": "morph", + "name": "Morph", + "display_name": "Morph", + "api": "https://api.morphllm.com/v1", + "doc": "https://docs.morphllm.com/api-reference/introduction", + "models": [ { - "id": "qwen3-coder-plus", - "name": "Qwen3-Coder-Plus", - "display_name": "Qwen3-Coder-Plus", + "id": "morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ "text" @@ -31039,28 +38484,27 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0, - "output": 0 + "input": 0.9, + "output": 1.9 } }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "auto", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ "text" @@ -31070,37 +38514,27 @@ ] }, "limit": { - "context": 128000, + "context": 32000, "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0, - "output": 0 + "input": 0.85, + "output": 1.55 } - } - ] - }, - "synthetic": { - "id": "synthetic", - "name": "Synthetic", - "display_name": "Synthetic", - "api": "https://api.synthetic.new/v1", - "doc": "https://synthetic.new/pricing", - "models": [ + }, { - "id": "hf:openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ "text" @@ -31110,31 +38544,31 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 16000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.8, + "output": 1.2 } } ] }, - "deepinfra": { - "id": "deepinfra", - "name": "Deep Infra", - "display_name": "Deep Infra", - "doc": "https://deepinfra.com/models", + "lmstudio": { + "id": "lmstudio", + "name": "LMStudio", + "display_name": "LMStudio", + "api": "http://127.0.0.1:1234/v1", + "doc": "https://lmstudio.ai/models", "models": [ { "id": "openai/gpt-oss-20b", @@ -31150,7 +38584,7 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -31163,14 +38597,14 @@ "release_date": "2025-08-05", "last_updated": "2025-08-05", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0, + "output": 0 } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen/qwen3-30b-a3b-2507", + "name": "Qwen3 30B A3B 2507", + "display_name": "Qwen3 30B A3B 2507", "modalities": { "input": [ "text" @@ -31180,37 +38614,28 @@ ] }, "limit": { - "context": 131072, + "context": 262144, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.05, - "output": 0.24 + "input": 0, + "output": 0 } - } - ] - }, - "zhipuai": { - "id": "zhipuai", - "name": "Zhipu AI", - "display_name": "Zhipu AI", - "api": "https://open.bigmodel.cn/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ + }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "qwen/qwen3-coder-30b", + "name": "Qwen3 Coder 30B", + "display_name": "Qwen3 Coder 30B", "modalities": { "input": [ "text" @@ -31220,76 +38645,84 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0, + "output": 0 } - }, + } + ] + }, + "sap-ai-core": { + "id": "sap-ai-core", + "name": "SAP AI Core", + "display_name": "SAP AI Core", + "doc": "https://help.sap.com/docs/sap-ai-core", + "models": [ { - "id": "glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "anthropic--claude-3.5-sonnet", + "name": "anthropic--claude-3.5-sonnet", + "display_name": "anthropic--claude-3.5-sonnet", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.6, - "output": 1.8 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "anthropic--claude-4-opus", + "name": "anthropic--claude-4-opus", + "display_name": "anthropic--claude-4-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -31297,33 +38730,37 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -31331,150 +38768,137 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 } }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "anthropic--claude-3-haiku", + "name": "anthropic--claude-3-haiku", + "display_name": "anthropic--claude-3-haiku", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 } - } - ] - }, - "submodel": { - "id": "submodel", - "name": "submodel", - "display_name": "submodel", - "api": "https://llm.submodel.ai/v1", - "doc": "https://submodel.gitbook.io", - "models": [ + }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "anthropic--claude-3-sonnet", + "name": "anthropic--claude-3-sonnet", + "display_name": "anthropic--claude-3-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0.1, - "output": 0.5 + "input": 3, + "output": 15 } - } - ] - }, - "zai": { - "id": "zai", - "name": "Z.AI", - "display_name": "Z.AI", - "api": "https://api.z.ai/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ + }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 } - }, - { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + }, + { + "id": "anthropic--claude-3.7-sonnet", + "name": "anthropic--claude-3.7-sonnet", + "display_name": "anthropic--claude-3.7-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -31482,69 +38906,69 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.03 } }, { - "id": "glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "anthropic--claude-4.5-sonnet", + "name": "anthropic--claude-4.5-sonnet", + "display_name": "anthropic--claude-4.5-sonnet", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -31553,30 +38977,36 @@ "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2025-01-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.6, - "output": 1.8 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -31584,41 +39014,33 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.31 } - } - ] - }, - "inference": { - "id": "inference", - "name": "Inference", - "display_name": "Inference", - "api": "https://inference.net/v1", - "doc": "https://inference.net/models", - "models": [ + }, { - "id": "mistral/mistral-nemo-12b-instruct", - "name": "Mistral Nemo 12B Instruct", - "display_name": "Mistral Nemo 12B Instruct", + "id": "anthropic--claude-3-opus", + "name": "anthropic--claude-3-opus", + "display_name": "anthropic--claude-3-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, + "context": 200000, "output": 4096 }, "temperature": true, @@ -31626,126 +39048,147 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.038, - "output": 0.1 + "input": 15, + "output": 75 } }, { - "id": "google/gemma-3", - "name": "Google Gemma 3", - "display_name": "Google Gemma 3", + "id": "anthropic--claude-4-sonnet", + "name": "anthropic--claude-4-sonnet", + "display_name": "anthropic--claude-4-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-01-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.15, - "output": 0.3 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "osmosis/osmosis-structure-0.6b", - "name": "Osmosis Structure 0.6B", - "display_name": "Osmosis Structure 0.6B", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 2048 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.1, - "output": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } - }, + } + ] + }, + "anthropic": { + "id": "anthropic", + "name": "Anthropic", + "display_name": "Anthropic", + "doc": "https://docs.anthropic.com/en/docs/about-claude/models", + "models": [ { - "id": "qwen/qwen3-embedding-4b", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", + "id": "claude-opus-4-0", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 2048 + "context": 200000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.01, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "qwen/qwen-2.5-7b-vision-instruct", - "name": "Qwen 2.5 7B Vision Instruct", - "display_name": "Qwen 2.5 7B Vision Instruct", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -31753,164 +39196,175 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.2, - "output": 0.2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.055, - "output": 0.055 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.025, - "output": 0.025 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "claude-3-5-sonnet-20240620", + "name": "Claude Sonnet 3.5", + "display_name": "Claude Sonnet 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 0.02, - "output": 0.02 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "claude-3-5-haiku-latest", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 } - } - ] - }, - "requesty": { - "id": "requesty", - "name": "Requesty", - "display_name": "Requesty", - "api": "https://router.requesty.ai/v1", - "doc": "https://requesty.ai/solution/llm-routing/models", - "models": [ + }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 200000, "output": 64000 }, "temperature": true, @@ -31921,60 +39375,59 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 3 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 } }, { - "id": "xai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "claude-3-opus-20240229", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 64000 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05, - "cache_write": 0.2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -31982,8 +39435,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -31993,26 +39446,24 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "cache_write": 4.5 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -32020,8 +39471,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -32031,26 +39482,24 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.55 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -32058,8 +39507,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -32069,66 +39518,71 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31, - "cache_write": 2.375 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -32136,31 +39590,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "claude-3-5-haiku-20241022", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -32169,23 +39625,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 } }, { - "id": "openai/o4-mini", - "name": "o4 Mini", - "display_name": "o4 Mini", + "id": "claude-3-haiku-20240307", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -32193,43 +39651,44 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 } }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -32237,70 +39696,71 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "claude-3-7-sonnet-latest", + "name": "Claude Sonnet 3.7 (latest)", + "display_name": "Claude Sonnet 3.7 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "claude-sonnet-4-0", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ "text", - "audio", "image", - "video" + "pdf" ], "output": [ - "text", - "audio", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -32308,23 +39768,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -32343,8 +39805,8 @@ "attachment": true, "open_weights": false, "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { "input": 15, "output": 75, @@ -32353,13 +39815,14 @@ } }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "claude-3-sonnet-20240229", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -32367,34 +39830,34 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 } }, { - "id": "anthropic/claude-haiku-4-5", + "id": "claude-haiku-4-5-20251001", "name": "Claude Haiku 4.5", "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -32402,7 +39865,7 @@ }, "limit": { "context": 200000, - "output": 62000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -32412,7 +39875,7 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-01", + "knowledge": "2025-02-28", "release_date": "2025-10-15", "last_updated": "2025-10-15", "cost": { @@ -32421,23 +39884,31 @@ "cache_read": 0.1, "cache_write": 1.25 } - }, + } + ] + }, + "fireworks-ai": { + "id": "fireworks-ai", + "name": "Fireworks AI", + "display_name": "Fireworks AI", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://fireworks.ai/docs/", + "models": [ { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "accounts/fireworks/models/deepseek-r1-0528", + "name": "Deepseek R1 05/28", + "display_name": "Deepseek R1 05/28", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 160000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -32445,34 +39916,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 3, + "output": 8 } }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "accounts/fireworks/models/deepseek-v3p1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -32480,34 +39948,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.56, + "output": 1.68 } }, { - "id": "anthropic/claude-3-7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "accounts/fireworks/models/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -32515,34 +39980,62 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 1.2 } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "accounts/fireworks/models/deepseek-v3-0324", + "name": "Deepseek V3 03-24", + "display_name": "Deepseek V3 03-24", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 160000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "cost": { + "input": 0.9, + "output": 0.9 + } + }, + { + "id": "accounts/fireworks/models/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -32550,31 +40043,19 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.5 } - } - ] - }, - "morph": { - "id": "morph", - "name": "Morph", - "display_name": "Morph", - "api": "https://api.morphllm.com/v1", - "doc": "https://docs.morphllm.com/api-reference/introduction", - "models": [ + }, { - "id": "morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "accounts/fireworks/models/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -32584,27 +40065,60 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.9, - "output": 1.9 + "input": 1, + "output": 3 + } + }, + { + "id": "accounts/fireworks/models/qwen3-235b-a22b", + "name": "Qwen3 235B-A22B", + "display_name": "Qwen3 235B-A22B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.22, + "output": 0.88 } }, { - "id": "auto", - "name": "Auto", - "display_name": "Auto", + "id": "accounts/fireworks/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -32614,27 +40128,28 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.85, - "output": 1.55 + "input": 0.05, + "output": 0.2 } }, { - "id": "morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "accounts/fireworks/models/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -32644,36 +40159,28 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.15, + "output": 0.6 } - } - ] - }, - "lmstudio": { - "id": "lmstudio", - "name": "LMStudio", - "display_name": "LMStudio", - "api": "http://127.0.0.1:1234/v1", - "doc": "https://lmstudio.ai/models", - "models": [ + }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "accounts/fireworks/models/glm-4p5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -32684,7 +40191,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -32694,17 +40201,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0, - "output": 0 + "input": 0.22, + "output": 0.88 } }, { - "id": "qwen/qwen3-30b-a3b-2507", - "name": "Qwen3 30B A3B 2507", - "display_name": "Qwen3 30B A3B 2507", + "id": "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -32714,8 +40222,8 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -32724,18 +40232,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0, - "output": 0 + "input": 0.45, + "output": 1.8 } }, { - "id": "qwen/qwen3-coder-30b", - "name": "Qwen3 Coder 30B", - "display_name": "Qwen3 Coder 30B", + "id": "accounts/fireworks/models/glm-4p5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -32745,140 +40252,143 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0, - "output": 0 + "input": 0.55, + "output": 2.19 } } ] }, - "anthropic": { - "id": "anthropic", - "name": "Anthropic", - "display_name": "Anthropic", - "doc": "https://docs.anthropic.com/en/docs/about-claude/models", + "io-net": { + "id": "io-net", + "name": "IO.NET", + "display_name": "IO.NET", + "api": "https://api.intelligence.io.solutions/api/v1", + "doc": "https://io.net/docs/guides/intelligence/io-intelligence", "models": [ { - "id": "claude-opus-4-0", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "openai/gpt-oss-20b", + "name": "GPT-OSS 20B", + "display_name": "GPT-OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 64000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.03, + "output": 0.14, + "cache_read": 0.015, + "cache_write": 0.06 } }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.04, + "output": 0.4, + "cache_read": 0.02, + "cache_write": 0.08 } - }, + } + ] + }, + "azure-cognitive-services": { + "id": "azure-cognitive-services", + "name": "Azure Cognitive Services", + "display_name": "Azure Cognitive Services", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1, + "output": 2 } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ "text", @@ -32889,99 +40399,90 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.1, + "output": 0.3 } }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 0.9 } }, { - "id": "claude-3-5-haiku-latest", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 2, + "output": 6 } }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", @@ -32992,10 +40493,10 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -33003,54 +40504,50 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 15, + "output": 120 } }, { - "id": "claude-3-opus-20240229", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.35, + "output": 5.4 } }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -33061,10 +40558,10 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -33072,20 +40569,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", @@ -33096,66 +40592,61 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 } }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.125, + "output": 0.5 } }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ "text", @@ -33166,104 +40657,94 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 10, + "output": 30 } }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.125, + "output": 0.5 } }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.17, + "output": 0.68 } }, { - "id": "claude-3-haiku-20240307", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -33271,29 +40752,29 @@ }, "limit": { "context": 200000, - "output": 4096 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 1.5, + "output": 6, + "cache_read": 0.375 } }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -33305,9 +40786,9 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -33315,235 +40796,203 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "claude-3-7-sonnet-latest", - "name": "Claude Sonnet 3.7 (latest)", - "display_name": "Claude Sonnet 3.7 (latest)", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 0.15 } }, { - "id": "claude-sonnet-4-0", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.5, + "output": 2 } }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.3, + "output": 0.61 } }, { - "id": "claude-3-sonnet-20240229", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 0.1, + "output": 0 } }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.1, + "output": 0 } - } - ] - }, - "fireworks-ai": { - "id": "fireworks-ai", - "name": "Fireworks AI", - "display_name": "Fireworks AI", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://fireworks.ai/docs/", - "models": [ + }, { - "id": "accounts/fireworks/models/deepseek-r1-0528", - "name": "Deepseek R1 05/28", - "display_name": "Deepseek R1 05/28", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 8 + "input": 0.2, + "output": 0.78 } }, { - "id": "accounts/fireworks/models/deepseek-v3p1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -33553,61 +41002,64 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.56, - "output": 1.68 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 } }, { - "id": "accounts/fireworks/models/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.25, + "output": 2, + "cache_read": 0.03 } }, { - "id": "accounts/fireworks/models/deepseek-v3-0324", - "name": "Deepseek V3 03-24", - "display_name": "Deepseek V3 03-24", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ "text" @@ -33617,59 +41069,65 @@ ] }, "limit": { - "context": 160000, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.9, - "output": 0.9 + "input": 0.16, + "output": 0.64 } }, { - "id": "accounts/fireworks/models/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 256000, + "context": 128000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.6, - "output": 2.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "accounts/fireworks/models/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -33679,60 +41137,65 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 1, - "output": 3 + "input": 0.3, + "output": 0.5, + "reasoning": 0.5, + "cache_read": 0.075 } }, { - "id": "accounts/fireworks/models/qwen3-235b-a22b", - "name": "Qwen3 235B-A22B", - "display_name": "Qwen3 235B-A22B", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.22, - "output": 0.88 + "input": 15, + "output": 60, + "cache_read": 7.5 } }, { - "id": "accounts/fireworks/models/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -33742,101 +41205,107 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.3, + "output": 0.61 } }, { - "id": "accounts/fireworks/models/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.08, + "output": 0.32, + "input_audio": 4 } }, { - "id": "accounts/fireworks/models/glm-4p5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.22, - "output": 0.88 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 } }, { - "id": "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 1047576, "output": 32768 }, "temperature": true, @@ -33844,19 +41313,21 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.45, - "output": 1.8 + "input": 2, + "output": 8, + "cache_read": 0.5 } }, { - "id": "accounts/fireworks/models/glm-4p5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -33866,38 +41337,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0.04, + "output": 0.04 } - } - ] - }, - "io-net": { - "id": "io-net", - "name": "IO.NET", - "display_name": "IO.NET", - "api": "https://api.intelligence.io.solutions/api/v1", - "doc": "https://io.net/docs/guides/intelligence/io-intelligence", - "models": [ + }, { - "id": "openai/gpt-oss-20b", - "name": "GPT-OSS 20B", - "display_name": "GPT-OSS 20B", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -33907,71 +41368,61 @@ ] }, "limit": { - "context": 64000, + "context": 4096, "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.03, - "output": 0.14, - "cache_read": 0.015, - "cache_write": 0.06 + "input": 1.5, + "output": 2 } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.04, - "output": 0.4, - "cache_read": 0.02, - "cache_write": 0.08 + "input": 2.5, + "output": 10, + "cache_read": 1.25 } - } - ] - }, - "azure-cognitive-services": { - "id": "azure-cognitive-services", - "name": "Azure Cognitive Services", - "display_name": "Azure Cognitive Services", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ + }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ "text" @@ -33981,8 +41432,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -33990,19 +41441,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1, - "output": 2 + "input": 0.13, + "output": 0.52 } }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ "text", @@ -34014,7 +41465,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -34022,125 +41473,135 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.1, - "output": 0.3 + "input": 2.04, + "output": 2.04 } }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.3, - "output": 0.9 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2, - "output": 6 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 } }, { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 1.35, - "output": 5.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -34148,21 +41609,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 } }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ "text", @@ -34176,62 +41637,63 @@ "context": 128000, "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.14, + "output": 0 } }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.25, + "output": 2, + "cache_read": 0.025 } }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -34239,27 +41701,27 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 10, - "output": 30 + "input": 0.71, + "output": 0.71 } }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -34269,29 +41731,30 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.125, - "output": 0.5 + "input": 16.5, + "output": 66, + "cache_read": 8.25 } }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ "text" @@ -34301,8 +41764,8 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -34312,17 +41775,17 @@ "attachment": false, "open_weights": true, "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.13, + "output": 0.52 } }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ "text" @@ -34332,30 +41795,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 3, + "output": 4 } }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -34366,30 +41827,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 10, + "output": 30 } }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -34400,7 +41859,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -34409,18 +41868,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 0.15 + "input": 2.68, + "output": 3.54 } }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -34430,8 +41889,8 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": false, @@ -34439,19 +41898,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.5, - "output": 2 + "input": 0.15, + "output": 0.6 } }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -34461,8 +41920,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34471,18 +41930,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.3, - "output": 0.61 + "input": 1.14, + "output": 4.56 } }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -34493,25 +41952,27 @@ }, "limit": { "context": 8192, - "output": 1536 + "output": 2048 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.1, - "output": 0 + "input": 2.68, + "output": 3.54 } }, { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -34521,38 +41982,36 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 8191, + "output": 3072 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.1, + "input": 0.13, "output": 0 } }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -34560,20 +42019,21 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.2, - "output": 0.78 + "input": 3, + "output": 15, + "cache_read": 0.75 } }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ "text" @@ -34583,44 +42043,43 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 16384, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.5, + "output": 1.5 } }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -34628,19 +42087,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -34654,61 +42114,56 @@ "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.16, - "output": 0.64 + "input": 0.075, + "output": 0.3 } }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.125, + "output": 0.5 } }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -34719,7 +42174,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34728,21 +42183,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0.56, + "output": 1.68 } }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ "text", @@ -34753,66 +42206,67 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 16384 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 1.25, + "output": 10, + "cache_read": 0.13 } }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 } }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" @@ -34820,95 +42274,91 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + "input": 0.25, + "output": 1 } }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 2.5, + "output": 10 } }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 2.5, + "output": 10 } }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -34919,58 +42369,63 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.15, + "output": 0.6 } }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 1.5, - "output": 2 + "input": 5, + "output": 25, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", @@ -34982,7 +42437,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -34991,89 +42446,95 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.4, + "output": 2 } }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.13, - "output": 0.52 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 2.04, - "output": 2.04 + "input": 0.13, + "output": 0.52 } }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { @@ -35089,89 +42550,83 @@ "attachment": false, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.13 + "cache_read": 0.125 } }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 256000, + "output": 10000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 163840, + "output": 163840 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.35, + "output": 5.4 } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -35181,97 +42636,90 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 5.33, + "output": 16 } }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.14, - "output": 0 + "input": 60, + "output": 120 } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.075, + "output": 0.3 } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ "text" @@ -35281,28 +42729,27 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.1, + "output": 0 } }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" @@ -35312,10 +42759,10 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -35323,19 +42770,20 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 + "input": 3, + "output": 15, + "reasoning": 15, + "cache_read": 0.75 } }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -35346,58 +42794,59 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 4000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.15, + "output": 0.6 } }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "attachment": true, + "open_weights": true, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 3, - "output": 4 + "input": 0.12, + "output": 0 } }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ "text", @@ -35409,7 +42858,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35417,19 +42866,55 @@ "supported": false }, "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.37, + "output": 0.37 + } + }, + { + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 10, - "output": 30 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -35439,8 +42924,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35448,19 +42933,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 2.68, - "output": 3.54 + "input": 60, + "output": 120 } }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ "text" @@ -35470,8 +42955,8 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -35484,14 +42969,48 @@ "release_date": "2024-04-23", "last_updated": "2024-04-23", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.17, + "output": 0.68 } }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000000, + "output": 30000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } + }, + { + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -35501,59 +43020,62 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1.14, - "output": 4.56 + "input": 1.35, + "output": 5.4 } }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 2000000, + "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 } }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -35564,7 +43086,7 @@ }, "limit": { "context": 8191, - "output": 3072 + "output": 1536 }, "tool_call": false, "reasoning": { @@ -35575,46 +43097,56 @@ "release_date": "2024-01-25", "last_updated": "2024-01-25", "cost": { - "input": 0.13, + "input": 0.02, "output": 0 } }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 } - }, + } + ] + }, + "llama": { + "id": "llama", + "name": "Llama", + "display_name": "Llama", + "api": "https://api.llama.com/compat/v1/", + "doc": "https://llama.developer.meta.com/docs/models", + "models": [ { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "llama-3.3-8b-instruct", + "name": "Llama-3.3-8B-Instruct", + "display_name": "Llama-3.3-8B-Instruct", "modalities": { "input": [ "text" @@ -35624,28 +43156,28 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0, + "output": 0 } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ "text", @@ -35656,31 +43188,28 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 } }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -35696,26 +43225,26 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0, + "output": 0 } }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "llama-4-scout-17b-16e-instruct-fp8", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -35726,24 +43255,24 @@ "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0, + "output": 0 } }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "groq-llama-4-maverick-17b-128e-instruct", + "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ "text" @@ -35753,33 +43282,31 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0, + "output": 0 } }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "cerebras-llama-4-scout-17b-16e-instruct", + "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -35787,41 +43314,38 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0, + "output": 0 } }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "cerebras-llama-4-maverick-17b-128e-instruct", + "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -35829,31 +43353,38 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0, + "output": 0 } - }, + } + ] + }, + "scaleway": { + "id": "scaleway", + "name": "Scaleway", + "display_name": "Scaleway", + "api": "https://api.scaleway.ai/v1", + "doc": "https://www.scaleway.com/en/docs/generative-apis/", + "models": [ { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 260000, "output": 8192 }, "temperature": true, @@ -35863,21 +43394,21 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.25, - "output": 1 + "input": 0.75, + "output": 2.25 } }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "pixtral-12b-2409", + "name": "Pixtral 12B 2409", + "display_name": "Pixtral 12B 2409", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -35885,28 +43416,26 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 2.5, - "output": 10 + "input": 0.2, + "output": 0.2 } }, { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -35916,29 +43445,28 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.2, + "output": 0.2 } }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ "text" @@ -35949,27 +43477,26 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-07-25", + "last_updated": "2024-07-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 0.2 } }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral Small 3.2 24B Instruct (2506)", + "display_name": "Mistral Small 3.2 24B Instruct (2506)", "modalities": { "input": [ "text", @@ -35980,35 +43507,30 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.15, + "output": 0.35 } }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -36016,163 +43538,152 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.4, - "output": 2 + "input": 0.2, + "output": 0.8 } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 100000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.9, + "output": 0.9 } }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 0, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.003, + "output": 0 } }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.9, + "output": 0.9 } }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "attachment": true, + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.15, + "output": 0.35 } }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -36182,29 +43693,27 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.15, + "output": 0.6 } }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "bge-multilingual-gemma2", + "name": "BGE Multilingual Gemma2", + "display_name": "BGE Multilingual Gemma2", "modalities": { "input": [ "text" @@ -36214,59 +43723,68 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "release_date": "2024-07-26", + "last_updated": "2025-06-15", "cost": { - "input": 5.33, - "output": 16 + "input": 0.13, + "output": 0 } }, { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 40000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 60, - "output": 120 + "input": 0.25, + "output": 0.5 } - }, + } + ] + }, + "amazon-bedrock": { + "id": "amazon-bedrock", + "name": "Amazon Bedrock", + "display_name": "Amazon Bedrock", + "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", + "models": [ { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "cohere.command-r-plus-v1:0", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -36286,18 +43804,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-04-04", + "last_updated": "2024-04-04", "cost": { - "input": 0.075, - "output": 0.3 + "input": 3, + "output": 15 } }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "anthropic.claude-v2", + "name": "Claude 2", + "display_name": "Claude 2", "modalities": { "input": [ "text" @@ -36307,72 +43825,76 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 100000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "open_weights": false, + "knowledge": "2023-08", + "release_date": "2023-07-11", + "last_updated": "2023-07-11", "cost": { - "input": 0.1, - "output": 0 + "input": 8, + "output": 24 } }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "anthropic.claude-3-7-sonnet-20250219-v1:0", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2024-04", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { "input": 3, "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -36380,51 +43902,53 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.15, - "output": 0.6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "qwen.qwen3-coder-30b-a3b-v1:0", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 262144, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.12, - "output": 0 + "input": 0.15, + "output": 0.6 } }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "meta.llama3-2-11b-instruct-v1:0", + "name": "Llama 3.2 11B Instruct", + "display_name": "Llama 3.2 11B Instruct", "modalities": { "input": [ "text", @@ -36436,7 +43960,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36449,18 +43973,19 @@ "release_date": "2024-09-25", "last_updated": "2024-09-25", "cost": { - "input": 0.37, - "output": 0.37 + "input": 0.16, + "output": 0.16 } }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "anthropic.claude-3-haiku-20240307-v1:0", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -36468,61 +43993,59 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-02", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.25, + "output": 1.25 } }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "meta.llama3-2-90b-instruct-v1:0", + "name": "Llama 3.2 90B Instruct", + "display_name": "Llama 3.2 90B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 60, - "output": 120 + "input": 0.72, + "output": 0.72 } }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "meta.llama3-2-1b-instruct-v1:0", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -36532,62 +44055,59 @@ ] }, "limit": { - "context": 128000, + "context": 131000, "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.1, + "output": 0.1 } }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "anthropic.claude-v2:1", + "name": "Claude 2.1", + "display_name": "Claude 2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2023-08", + "release_date": "2023-11-21", + "last_updated": "2023-11-21", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 8, + "output": 24 } }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "deepseek.v3-v1:0", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -36598,10 +44118,10 @@ }, "limit": { "context": 163840, - "output": 163840 + "output": 81920 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -36609,50 +44129,48 @@ "attachment": false, "open_weights": true, "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.58, + "output": 1.68 } }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "cohere.command-light-text-v14", + "name": "Command Light", + "display_name": "Command Light", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "attachment": false, + "open_weights": true, + "knowledge": "2023-08", + "release_date": "2023-11-01", + "last_updated": "2023-11-01", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.3, + "output": 0.6 } }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "ai21.jamba-1-5-large-v1:0", + "name": "Jamba 1.5 Large", + "display_name": "Jamba 1.5 Large", "modalities": { "input": [ "text" @@ -36662,78 +44180,71 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 256000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.02, - "output": 0 + "input": 2, + "output": 8 } }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "meta.llama3-3-70b-instruct-v1:0", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 0.72, + "output": 0.72 } - } - ] - }, - "llama": { - "id": "llama", - "name": "Llama", - "display_name": "Llama", - "api": "https://api.llama.com/compat/v1/", - "doc": "https://llama.developer.meta.com/docs/models", - "models": [ + }, { - "id": "llama-3.3-8b-instruct", - "name": "Llama-3.3-8B-Instruct", - "display_name": "Llama-3.3-8B-Instruct", + "id": "anthropic.claude-3-opus-20240229-v1:0", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 4096 }, "temperature": true, @@ -36742,31 +44253,32 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2023-08", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75 } }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "amazon.nova-pro-v1:0", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -36774,19 +44286,20 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0, - "output": 0 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "meta.llama3-1-8b-instruct-v1:0", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -36804,63 +44317,65 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0 + "input": 0.22, + "output": 0.22 } }, { - "id": "llama-4-scout-17b-16e-instruct-fp8", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "qwen.qwen3-32b-v1:0", + "name": "Qwen3 32B (dense)", + "display_name": "Qwen3 32B (dense)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6 } }, { - "id": "groq-llama-4-maverick-17b-128e-instruct", - "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "id": "anthropic.claude-3-5-sonnet-20240620-v1:0", + "name": "Claude Sonnet 3.5", + "display_name": "Claude Sonnet 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -36868,50 +44383,57 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "cerebras-llama-4-scout-17b-16e-instruct", - "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", - "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "id": "anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "cerebras-llama-4-maverick-17b-128e-instruct", - "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "id": "cohere.command-r-v1:0", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -36929,29 +44451,20 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-04", + "release_date": "2024-03-11", + "last_updated": "2024-03-11", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5 } - } - ] - }, - "scaleway": { - "id": "scaleway", - "name": "Scaleway", - "display_name": "Scaleway", - "api": "https://api.scaleway.ai/v1", - "doc": "https://www.scaleway.com/en/docs/generative-apis/", - "models": [ + }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "amazon.nova-micro-v1:0", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ "text" @@ -36961,7 +44474,7 @@ ] }, "limit": { - "context": 260000, + "context": 128000, "output": 8192 }, "temperature": true, @@ -36969,23 +44482,24 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.75, - "output": 2.25 + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 } }, { - "id": "pixtral-12b-2409", - "name": "Pixtral 12B 2409", - "display_name": "Pixtral 12B 2409", + "id": "meta.llama3-1-70b-instruct-v1:0", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -37000,19 +44514,20 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.72, + "output": 0.72 } }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "meta.llama3-70b-instruct-v1:0", + "name": "Llama 3 70B Instruct", + "display_name": "Llama 3 70B Instruct", "modalities": { "input": [ "text" @@ -37022,28 +44537,28 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.2, - "output": 0.2 + "input": 2.65, + "output": 3.5 } }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "deepseek.r1-v1:0", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -37054,37 +44569,40 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2024-07-25", + "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.35, + "output": 5.4 } }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral Small 3.2 24B Instruct (2506)", - "display_name": "Mistral Small 3.2 24B Instruct (2506)", + "id": "anthropic.claude-3-5-sonnet-20241022-v2:0", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 8192 }, "temperature": true, @@ -37092,19 +44610,22 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.15, - "output": 0.35 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "cohere.command-text-v14", + "name": "Command", + "display_name": "Command", "modalities": { "input": [ "text" @@ -37114,90 +44635,100 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2023-08", + "release_date": "2023-11-01", + "last_updated": "2023-11-01", "cost": { - "input": 0.2, - "output": 0.8 + "input": 1.5, + "output": 2 } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "anthropic.claude-opus-4-20250514-v1:0", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.9, - "output": 0.9 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (Global)", + "display_name": "Claude Opus 4.5 (Global)", "modalities": { "input": [ - "audio" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 0, - "output": 4096 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.003, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "qwen.qwen3-coder-480b-a35b-v1:0", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -37207,60 +44738,64 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.9, - "output": 0.9 + "input": 0.22, + "output": 1.8 } }, { - "id": "voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "audio" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.15, - "output": 0.35 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 } }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "meta.llama3-2-3b-instruct-v1:0", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -37270,27 +44805,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { "input": 0.15, - "output": 0.6 + "output": 0.15 } }, { - "id": "bge-multilingual-gemma2", - "name": "BGE Multilingual Gemma2", - "display_name": "BGE Multilingual Gemma2", + "id": "anthropic.claude-instant-v1", + "name": "Claude Instant", + "display_name": "Claude Instant", "modalities": { "input": [ "text" @@ -37300,39 +44836,41 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 100000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-07-26", - "last_updated": "2025-06-15", + "knowledge": "2023-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.13, - "output": 0 + "input": 0.8, + "output": 2.4 } }, { - "id": "gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "amazon.nova-premier-v1:0", + "name": "Nova Premier", + "display_name": "Nova Premier", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 8192 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -37342,188 +44880,181 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.25, - "output": 0.5 + "input": 2.5, + "output": 12.5 } - } - ] - }, - "amazon-bedrock": { - "id": "amazon-bedrock", - "name": "Amazon Bedrock", - "display_name": "Amazon Bedrock", - "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", - "models": [ + }, { - "id": "cohere.command-r-plus-v1:0", - "name": "Command R+", - "display_name": "Command R+", + "id": "anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-04", - "last_updated": "2024-04-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 } }, { - "id": "anthropic.claude-v2", - "name": "Claude 2", - "display_name": "Claude 2", + "id": "meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 4096 + "context": 3500000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-08", - "release_date": "2023-07-11", - "last_updated": "2023-07-11", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 8, - "output": 24 + "input": 0.17, + "output": 0.66 } }, { - "id": "anthropic.claude-3-7-sonnet-20250219-v1:0", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "ai21.jamba-1-5-mini-v1:0", + "name": "Jamba 1.5 Mini", + "display_name": "Jamba 1.5 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.2, + "output": 0.4 } }, { - "id": "anthropic.claude-sonnet-4-20250514-v1:0", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "meta.llama3-8b-instruct-v1:0", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2023-03", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 0.6 } }, { - "id": "qwen.qwen3-coder-30b-a3b-v1:0", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "anthropic.claude-3-sonnet-20240229-v1:0", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2023-08", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0.15, - "output": 0.6 + "input": 3, + "output": 15 } }, { - "id": "meta.llama3-2-11b-instruct-v1:0", - "name": "Llama 3.2 11B Instruct", - "display_name": "Llama 3.2 11B Instruct", + "id": "meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ "text", @@ -37534,8 +45065,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -37544,62 +45075,62 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.24, + "output": 0.97 } }, { - "id": "anthropic.claude-3-haiku-20240307-v1:0", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "qwen.qwen3-235b-a22b-2507-v1:0", + "name": "Qwen3 235B A22B 2507", + "display_name": "Qwen3 235B A22B 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-02", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.25, - "output": 1.25 + "input": 0.22, + "output": 0.88 } }, { - "id": "meta.llama3-2-90b-instruct-v1:0", - "name": "Llama 3.2 90B Instruct", - "display_name": "Llama 3.2 90B Instruct", + "id": "amazon.nova-lite-v1:0", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -37607,50 +45138,64 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 } }, { - "id": "meta.llama3-2-1b-instruct-v1:0", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "anthropic.claude-3-5-haiku-20241022-v1:0", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 } - }, + } + ] + }, + "poe": { + "id": "poe", + "name": "Poe", + "display_name": "Poe", + "api": "https://api.poe.com/v1", + "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", + "models": [ { - "id": "anthropic.claude-v2:1", - "name": "Claude 2.1", - "display_name": "Claude 2.1", + "id": "xai/grok-4-fast-non-reasoning", + "name": "Grok-4-Fast-Non-Reasoning", + "display_name": "Grok-4-Fast-Non-Reasoning", "modalities": { "input": [ "text" @@ -37660,28 +45205,28 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 2000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-08", - "release_date": "2023-11-21", - "last_updated": "2023-11-21", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 8, - "output": 24 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 } }, { - "id": "deepseek.v3-v1:0", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok 4 Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", "modalities": { "input": [ "text" @@ -37691,29 +45236,29 @@ ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 2000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 } }, { - "id": "cohere.command-light-text-v14", - "name": "Command Light", - "display_name": "Command Light", + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok-4.1-Fast-Reasoning", + "display_name": "Grok-4.1-Fast-Reasoning", "modalities": { "input": [ "text" @@ -37723,31 +45268,28 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 2000000, + "output": 30000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-08", - "release_date": "2023-11-01", - "last_updated": "2023-11-01", - "cost": { - "input": 0.3, - "output": 0.6 - } + "attachment": true, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19" }, { - "id": "ai21.jamba-1-5-large-v1:0", - "name": "Jamba 1.5 Large", - "display_name": "Jamba 1.5 Large", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -37755,155 +45297,150 @@ }, "limit": { "context": 256000, - "output": 4096 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 2, - "output": 8 + "input": 3, + "output": 15, + "cache_read": 0.75 } }, { - "id": "meta.llama3-3-70b-instruct-v1:0", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-22", + "last_updated": "2025-08-22", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 } }, { - "id": "anthropic.claude-3-opus-20240229-v1:0", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "xai/grok-2", + "name": "Grok-2", + "display_name": "Grok-2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2023-08", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "release_date": "2025-01-14", + "last_updated": "2025-01-14", "cost": { - "input": 15, - "output": 75 + "input": 2, + "output": 10 } }, { - "id": "amazon.nova-pro-v1:0", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok-4.1-Fast-Non-Reasoning", + "display_name": "Grok-4.1-Fast-Non-Reasoning", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 2000000, + "output": 30000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 - } + "release_date": "2025-11-19", + "last_updated": "2025-11-19" }, { - "id": "meta.llama3-1-8b-instruct-v1:0", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", "cost": { - "input": 0.22, - "output": 0.22 + "input": 3, + "output": 15, + "cache_read": 0.75 } }, { - "id": "qwen.qwen3-32b-v1:0", - "name": "Qwen3 32B (dense)", - "display_name": "Qwen3 32B (dense)", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -37913,533 +45450,461 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 } }, { - "id": "anthropic.claude-3-5-sonnet-20240620-v1:0", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "ideogramai/ideogram", + "name": "Ideogram", + "display_name": "Ideogram", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 150, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - } + "release_date": "2024-04-03", + "last_updated": "2024-04-03" }, { - "id": "anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "ideogramai/ideogram-v2a", + "name": "Ideogram-v2a", + "display_name": "Ideogram-v2a", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 150, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - } + "release_date": "2025-02-27", + "last_updated": "2025-02-27" }, { - "id": "cohere.command-r-v1:0", - "name": "Command R", - "display_name": "Command R", + "id": "ideogramai/ideogram-v2a-turbo", + "name": "Ideogram-v2a-Turbo", + "display_name": "Ideogram-v2a-Turbo", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 150, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-03-11", - "last_updated": "2024-03-11", - "cost": { - "input": 0.5, - "output": 1.5 - } + "attachment": true, + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27" }, { - "id": "amazon.nova-micro-v1:0", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "ideogramai/ideogram-v2", + "name": "Ideogram-v2", + "display_name": "Ideogram-v2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 150, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 - } + "release_date": "2024-08-21", + "last_updated": "2024-08-21" }, { - "id": "meta.llama3-1-70b-instruct-v1:0", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "runwayml/runway", + "name": "Runway", + "display_name": "Runway", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.72, - "output": 0.72 - } + "attachment": true, + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2024-10-11" }, { - "id": "meta.llama3-70b-instruct-v1:0", - "name": "Llama 3 70B Instruct", - "display_name": "Llama 3 70B Instruct", + "id": "runwayml/runway-gen-4-turbo", + "name": "Runway-Gen-4-Turbo", + "display_name": "Runway-Gen-4-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 256, + "output": 0 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 2.65, - "output": 3.5 - } + "attachment": true, + "open_weights": false, + "release_date": "2025-05-09", + "last_updated": "2025-05-09" }, { - "id": "deepseek.r1-v1:0", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "elevenlabs/elevenlabs-v3", + "name": "ElevenLabs-v3", + "display_name": "ElevenLabs-v3", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { "context": 128000, - "output": 32768 + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", - "cost": { - "input": 1.35, - "output": 5.4 - } + "release_date": "2025-06-05", + "last_updated": "2025-06-05" }, { - "id": "anthropic.claude-3-5-sonnet-20241022-v2:0", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "elevenlabs/elevenlabs-music", + "name": "ElevenLabs-Music", + "display_name": "ElevenLabs-Music", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 2000, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - } + "release_date": "2025-08-29", + "last_updated": "2025-08-29" }, { - "id": "cohere.command-text-v14", - "name": "Command", - "display_name": "Command", + "id": "elevenlabs/elevenlabs-v2.5-turbo", + "name": "ElevenLabs-v2.5-Turbo", + "display_name": "ElevenLabs-v2.5-Turbo", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 0 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-08", - "release_date": "2023-11-01", - "last_updated": "2023-11-01", - "cost": { - "input": 1.5, - "output": 2 - } + "attachment": true, + "open_weights": false, + "release_date": "2024-10-28", + "last_updated": "2024-10-28" }, { - "id": "anthropic.claude-opus-4-20250514-v1:0", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "google/nano-banana", + "name": "Nano-Banana", + "display_name": "Nano-Banana", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.21, + "output": 1.8 } }, { - "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (Global)", - "display_name": "Claude Opus 4.5 (Global)", + "id": "google/imagen-4", + "name": "Imagen-4", + "display_name": "Imagen-4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", - "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 - } + "release_date": "2025-05-22", + "last_updated": "2025-05-22" }, { - "id": "qwen.qwen3-coder-480b-a35b-v1:0", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "google/imagen-3", + "name": "Imagen-3", + "display_name": "Imagen-3", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", - "cost": { - "input": 0.22, - "output": 1.8 - } + "attachment": true, + "open_weights": false, + "release_date": "2024-10-15", + "last_updated": "2024-10-15" }, { - "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "google/imagen-4-ultra", + "name": "Imagen-4-Ultra", + "display_name": "Imagen-4-Ultra", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - } + "release_date": "2025-05-24", + "last_updated": "2025-05-24" }, { - "id": "meta.llama3-2-3b-instruct-v1:0", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4096 + "context": 1065535, + "output": 65535 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-26", + "last_updated": "2025-04-26", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.21, + "output": 1.8, + "cache_read": 0.052 } }, { - "id": "anthropic.claude-instant-v1", - "name": "Claude Instant", - "display_name": "Claude Instant", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini-2.0-Flash-Lite", + "display_name": "Gemini-2.0-Flash-Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 4096 + "context": 990000, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.052, + "output": 0.21 } }, { - "id": "amazon.nova-premier-v1:0", - "name": "Nova Premier", - "display_name": "Nova Premier", + "id": "google/gemini-3-pro", + "name": "Gemini-3-Pro", + "display_name": "Gemini-3-Pro", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 1048576, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -38447,329 +45912,278 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 2.5, - "output": 12.5 + "input": 1.6, + "output": 9.6, + "cache_read": 0.16 } }, { - "id": "anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "google/veo-3.1", + "name": "Veo-3.1", + "display_name": "Veo-3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - } + "release_date": "2025-10-15", + "last_updated": "2025-10-15" }, { - "id": "meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct", - "display_name": "Llama 4 Scout 17B Instruct", + "id": "google/imagen-3-fast", + "name": "Imagen-3-Fast", + "display_name": "Imagen-3-Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 3500000, - "output": 16384 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.17, - "output": 0.66 - } + "open_weights": false, + "release_date": "2024-10-17", + "last_updated": "2024-10-17" }, { - "id": "ai21.jamba-1-5-mini-v1:0", - "name": "Jamba 1.5 Mini", - "display_name": "Jamba 1.5 Mini", + "id": "google/lyria", + "name": "Lyria", + "display_name": "Lyria", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 0, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2024-08-15", - "last_updated": "2024-08-15", - "cost": { - "input": 0.2, - "output": 0.4 - } + "attachment": true, + "open_weights": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04" }, { - "id": "meta.llama3-8b-instruct-v1:0", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", + "id": "google/gemini-2.0-flash", + "name": "Gemini-2.0-Flash", + "display_name": "Gemini-2.0-Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 990000, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.3, - "output": 0.6 + "input": 0.1, + "output": 0.42 } }, { - "id": "anthropic.claude-3-sonnet-20240229-v1:0", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1024000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "release_date": "2025-06-19", + "last_updated": "2025-06-19", "cost": { - "input": 3, - "output": 15 + "input": 0.07, + "output": 0.28 } }, { - "id": "meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "google/veo-3", + "name": "Veo-3", + "display_name": "Veo-3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.24, - "output": 0.97 - } + "open_weights": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21" }, { - "id": "qwen.qwen3-235b-a22b-2507-v1:0", - "name": "Qwen3 235B A22B 2507", - "display_name": "Qwen3 235B A22B 2507", + "id": "google/veo-3-fast", + "name": "Veo-3-Fast", + "display_name": "Veo-3-Fast", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "context": 480, + "output": 0 }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", - "cost": { - "input": 0.22, - "output": 0.88 - } + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-13", + "last_updated": "2025-10-13" }, { - "id": "amazon.nova-lite-v1:0", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "google/imagen-4-fast", + "name": "Imagen-4-Fast", + "display_name": "Imagen-4-Fast", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 - } + "release_date": "2025-06-25", + "last_updated": "2025-06-25" }, { - "id": "anthropic.claude-3-5-haiku-20241022-v1:0", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "google/veo-2", + "name": "Veo-2", + "display_name": "Veo-2", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - } - } - ] - }, - "poe": { - "id": "poe", - "name": "Poe", - "display_name": "Poe", - "api": "https://api.poe.com/v1", - "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", - "models": [ + "release_date": "2024-12-02", + "last_updated": "2024-12-02" + }, { - "id": "facebook/llama-3.1-8b", - "name": "Llama-3.1-8B", - "display_name": "Llama-3.1-8B", + "id": "google/nano-banana-pro", + "name": "Nano-Banana-Pro", + "display_name": "Nano-Banana-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8192, + "context": 65536, "output": 0 }, "temperature": false, @@ -38779,59 +46193,63 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-08", - "last_updated": "2024-08-08", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.6, + "output": 9.6, + "cache_read": 0.16 } }, { - "id": "facebook/llama-3.1-405b", - "name": "Llama-3.1-405B", - "display_name": "Llama-3.1-405B", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 0 + "context": 1065535, + "output": 65535 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-08-08", - "last_updated": "2024-08-08", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 3, - "output": 3 + "input": 0.87, + "output": 7, + "cache_read": 0.22 } }, { - "id": "facebook/llama-3.1-70b", - "name": "Llama-3.1-70B", - "display_name": "Llama-3.1-70B", + "id": "google/veo-3.1-fast", + "name": "Veo-3.1-Fast", + "display_name": "Veo-3.1-Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 8192, + "context": 480, "output": 0 }, "temperature": false, @@ -38841,28 +46259,25 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-08", - "last_updated": "2024-08-08", - "cost": { - "input": 0.9, - "output": 0.9 - } + "release_date": "2025-10-15", + "last_updated": "2025-10-15" }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok-4-Fast-Non-Reasoning", - "display_name": "Grok-4-Fast-Non-Reasoning", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": false, "tool_call": true, @@ -38871,50 +46286,45 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.09, + "output": 0.36, + "cache_read": 0.022 } }, { - "id": "xai/grok-4-fast-reasoning", - "name": "Grok 4 Fast Reasoning", - "display_name": "Grok 4 Fast Reasoning", + "id": "openai/sora-2", + "name": "Sora-2", + "display_name": "Sora-2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 0, + "output": 0 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - } + "release_date": "2025-10-06", + "last_updated": "2025-10-06" }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "openai/o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", "modalities": { "input": [ "text", @@ -38925,8 +46335,8 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -38936,18 +46346,17 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 140, + "output": 540 } }, { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", @@ -38958,7 +46367,7 @@ ] }, "limit": { - "context": 256000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -38969,29 +46378,30 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-22", - "last_updated": "2025-08-22", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 1.1, + "output": 9, + "cache_read": 0.11 } }, { - "id": "xai/grok-2", - "name": "Grok-2", - "display_name": "Grok-2", + "id": "openai/gpt-3.5-turbo-raw", + "name": "GPT-3.5-Turbo-Raw", + "display_name": "GPT-3.5-Turbo-Raw", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 4524, + "output": 2048 }, "temperature": false, "tool_call": true, @@ -39000,17 +46410,17 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-14", - "last_updated": "2025-01-14", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", "cost": { - "input": 2, - "output": 10 + "input": 0.45, + "output": 1.4 } }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "openai/gpt-4-classic", + "name": "GPT-4-Classic", + "display_name": "GPT-4-Classic", "modalities": { "input": [ "text", @@ -39021,8 +46431,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 4096 }, "temperature": false, "tool_call": true, @@ -39031,62 +46441,61 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "release_date": "2024-03-25", + "last_updated": "2024-03-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 27, + "output": 54 } }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0.36, + "output": 1.4, + "cache_read": 0.09 } }, { - "id": "ideogramai/ideogram", - "name": "Ideogram", - "display_name": "Ideogram", + "id": "openai/gpt-5-chat", + "name": "GPT-5-Chat", + "display_name": "GPT-5-Chat", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 0 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, @@ -39095,50 +46504,61 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03" + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } }, { - "id": "ideogramai/ideogram-v2a", - "name": "Ideogram-v2a", - "display_name": "Ideogram-v2a", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 0 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27" + "release_date": "2025-06-27", + "last_updated": "2025-06-27", + "cost": { + "input": 9, + "output": 36, + "cache_read": 2.2 + } }, { - "id": "ideogramai/ideogram-v2a-turbo", - "name": "Ideogram-v2a-Turbo", - "display_name": "Ideogram-v2a-Turbo", + "id": "openai/gpt-4o-search", + "name": "GPT-4o-Search", + "display_name": "GPT-4o-Search", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 0 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -39147,13 +46567,17 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27" + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "cost": { + "input": 2.2, + "output": 9 + } }, { - "id": "ideogramai/ideogram-v2", - "name": "Ideogram-v2", - "display_name": "Ideogram-v2", + "id": "openai/gpt-image-1-mini", + "name": "GPT-Image-1-Mini", + "display_name": "GPT-Image-1-Mini", "modalities": { "input": [ "text", @@ -39164,7 +46588,7 @@ ] }, "limit": { - "context": 150, + "context": 0, "output": 0 }, "temperature": false, @@ -39174,25 +46598,25 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-21", - "last_updated": "2024-08-21" + "release_date": "2025-08-26", + "last_updated": "2025-08-26" }, { - "id": "runwayml/runway", - "name": "Runway", - "display_name": "Runway", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-Turbo", + "display_name": "GPT-3.5-Turbo", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 0 + "context": 16384, + "output": 2048 }, "temperature": false, "tool_call": true, @@ -39201,51 +46625,61 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11" + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "cost": { + "input": 0.45, + "output": 1.4 + } }, { - "id": "runwayml/runway-gen-4-turbo", - "name": "Runway-Gen-4-Turbo", - "display_name": "Runway-Gen-4-Turbo", + "id": "openai/o3-mini-high", + "name": "o3-mini-high", + "display_name": "o3-mini-high", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 0 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-09", - "last_updated": "2025-05-09" + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "cost": { + "input": 0.99, + "output": 4 + } }, { - "id": "elevenlabs/elevenlabs-v3", - "name": "ElevenLabs-v3", - "display_name": "ElevenLabs-v3", + "id": "openai/chatgpt-4o-latest", + "name": "ChatGPT-4o-Latest", + "display_name": "ChatGPT-4o-Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { "context": 128000, - "output": 0 + "output": 8192 }, "temperature": false, "tool_call": true, @@ -39254,24 +46688,29 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05" + "release_date": "2024-08-14", + "last_updated": "2024-08-14", + "cost": { + "input": 4.5, + "output": 14 + } }, { - "id": "elevenlabs/elevenlabs-music", - "name": "ElevenLabs-Music", - "display_name": "ElevenLabs-Music", + "id": "openai/gpt-4-turbo", + "name": "GPT-4-Turbo", + "display_name": "GPT-4-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 2000, - "output": 0 + "context": 128000, + "output": 4096 }, "temperature": false, "tool_call": true, @@ -39280,52 +46719,61 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-29", - "last_updated": "2025-08-29" + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "cost": { + "input": 9, + "output": 27 + } }, { - "id": "elevenlabs/elevenlabs-v2.5-turbo", - "name": "ElevenLabs-v2.5-Turbo", - "display_name": "ElevenLabs-v2.5-Turbo", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 0 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-10-28", - "last_updated": "2024-10-28" + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + } }, { - "id": "google/nano-banana", - "name": "Nano-Banana", - "display_name": "Nano-Banana", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1-Instant", + "display_name": "GPT-5.1-Instant", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 0 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, @@ -39334,109 +46782,128 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0.21, - "output": 1.7 + "input": 1.1, + "output": 9, + "cache_read": 0.11 } }, { - "id": "google/imagen-4", - "name": "Imagen-4", - "display_name": "Imagen-4", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22" + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "cost": { + "input": 0.99, + "output": 4 + } }, { - "id": "google/imagen-3", - "name": "Imagen-3", - "display_name": "Imagen-3", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-10-15", - "last_updated": "2024-10-15" + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } }, { - "id": "google/imagen-4-ultra", - "name": "Imagen-4-Ultra", - "display_name": "Imagen-4-Ultra", + "id": "openai/gpt-5-nano", + "name": "GPT-5-nano", + "display_name": "GPT-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-24", - "last_updated": "2025-05-24" + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.045, + "output": 0.36, + "cache_read": 0.0045 + } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -39446,67 +46913,56 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-26", - "last_updated": "2025-04-26", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.21, - "output": 1.7, - "cache_read": 0.052 + "input": 1.1, + "output": 9 } }, { - "id": "google/gemini-3.0-pro", - "name": "Gemini-3.0-Pro", - "display_name": "Gemini-3.0-Pro", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", - "cost": { - "input": 1.6, - "output": 9.6, - "cache_read": 0.16 - } + "release_date": "2024-05-13", + "last_updated": "2024-05-13" }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini-2.0-Flash-Lite", - "display_name": "Gemini-2.0-Flash-Lite", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 990000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": false, "tool_call": true, @@ -39515,108 +46971,127 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.052, - "output": 0.21 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 } }, { - "id": "google/veo-3.1", - "name": "Veo-3.1", - "display_name": "Veo-3.1", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15" + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 0.99, + "output": 4, + "cache_read": 0.25 + } }, { - "id": "google/imagen-3-fast", - "name": "Imagen-3-Fast", - "display_name": "Imagen-3-Fast", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-10-17", - "last_updated": "2024-10-17" + "release_date": "2024-12-18", + "last_updated": "2024-12-18", + "cost": { + "input": 14, + "output": 54 + } }, { - "id": "google/lyria", - "name": "Lyria", - "display_name": "Lyria", + "id": "openai/gpt-5-mini", + "name": "GPT-5-mini", + "display_name": "GPT-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 0, - "output": 0 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04" + "release_date": "2025-06-25", + "last_updated": "2025-06-25", + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + } }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini-2.0-Flash", - "display_name": "Gemini-2.0-Flash", + "id": "openai/gpt-4o-aug", + "name": "GPT-4o-Aug", + "display_name": "GPT-4o-Aug", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 990000, + "context": 128000, "output": 8192 }, "temperature": false, @@ -39626,31 +47101,30 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2024-11-21", + "last_updated": "2024-11-21", "cost": { - "input": 0.1, - "output": 0.42 + "input": 2.2, + "output": 9, + "cache_read": 1.1 } }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1024000, - "output": 64000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -39660,27 +47134,28 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-19", - "last_updated": "2025-06-19", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0.07, - "output": 0.28 + "input": 18, + "output": 72 } }, { - "id": "google/veo-3", - "name": "Veo-3", - "display_name": "Veo-3", + "id": "openai/gpt-image-1", + "name": "GPT-Image-1", + "display_name": "GPT-Image-1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "video" + "image" ] }, "limit": { - "context": 480, + "context": 128000, "output": 0 }, "temperature": false, @@ -39690,24 +47165,25 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21" + "release_date": "2025-03-31", + "last_updated": "2025-03-31" }, { - "id": "google/veo-3-fast", - "name": "Veo-3-Fast", - "display_name": "Veo-3-Fast", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5-Turbo-Instruct", + "display_name": "GPT-3.5-Turbo-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 3500, + "output": 1024 }, "temperature": false, "tool_call": true, @@ -39716,111 +47192,125 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-13", - "last_updated": "2025-10-13" + "release_date": "2023-09-20", + "last_updated": "2023-09-20", + "cost": { + "input": 1.4, + "output": 1.8 + } }, { - "id": "google/imagen-4-fast", - "name": "Imagen-4-Fast", - "display_name": "Imagen-4-Fast", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-06-25", - "last_updated": "2025-06-25" + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + } }, { - "id": "google/veo-2", - "name": "Veo-2", - "display_name": "Veo-2", + "id": "openai/o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-12-02", - "last_updated": "2024-12-02" + "release_date": "2025-06-27", + "last_updated": "2025-06-27", + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + } }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "openai/gpt-4-classic-0314", + "name": "GPT-4-Classic-0314", + "display_name": "GPT-4-Classic-0314", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 8192, + "output": 4096 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "release_date": "2024-08-26", + "last_updated": "2024-08-26", "cost": { - "input": 0.87, - "output": 7, - "cache_read": 0.22 + "input": 27, + "output": 54 } }, { - "id": "google/veo-3.1-fast", - "name": "Veo-3.1-Fast", - "display_name": "Veo-3.1-Fast", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o-mini", + "display_name": "GPT-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 0 + "context": 128000, + "output": 4096 }, "temperature": false, "tool_call": true, @@ -39829,16 +47319,22 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15" + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.14, + "output": 0.54, + "cache_read": 0.068 + } }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -39856,8 +47352,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { "input": 1.1, "output": 9, @@ -39865,53 +47361,47 @@ } }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "openai/dall-e-3", + "name": "DALL-E-3", + "display_name": "DALL-E-3", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 800, + "output": 0 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", - "cost": { - "input": 0.22, - "output": 1.8, - "cache_read": 0.022 - } + "release_date": "2023-11-06", + "last_updated": "2023-11-06" }, { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1-Instant", - "display_name": "GPT-5.1-Instant", + "id": "openai/sora-2-pro", + "name": "Sora-2-Pro", + "display_name": "Sora-2-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 0, + "output": 0 }, "temperature": false, "tool_call": true, @@ -39920,18 +47410,13 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", - "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - } + "release_date": "2025-10-06", + "last_updated": "2025-10-06" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "openai/gpt-5-pro", + "name": "GPT-5-Pro", + "display_name": "GPT-5-Pro", "modalities": { "input": [ "text", @@ -39953,12 +47438,41 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 14, + "output": 110 + } + }, + { + "id": "openai/gpt-4o-mini-search", + "name": "GPT-4o-mini-Search", + "display_name": "GPT-4o-mini-Search", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "cost": { + "input": 0.14, + "output": 0.54 } }, { @@ -40075,7 +47589,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40108,7 +47623,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40142,7 +47658,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40165,7 +47682,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40176,7 +47693,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40210,7 +47728,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40233,7 +47752,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40244,7 +47763,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40277,7 +47797,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40299,7 +47820,7 @@ "last_updated": "2025-10-15", "cost": { "input": 0.85, - "output": 4.2, + "output": 4.3, "cache_read": 0.085, "cache_write": 1.1 } @@ -40311,7 +47832,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40334,7 +47856,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40345,7 +47867,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40378,7 +47901,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40412,7 +47936,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40435,7 +47960,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40446,7 +47971,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40480,7 +48006,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40502,7 +48029,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40513,7 +48040,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40536,10 +48064,45 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, + { + "id": "anthropic/claude-opus-4.5", + "name": "claude-opus-4.5", + "display_name": "claude-opus-4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 64000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-21", + "last_updated": "2025-11-21", + "cost": { + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 + } + }, { "id": "anthropic/claude-haiku-3.5", "name": "Claude-Haiku-3.5", @@ -40547,7 +48110,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40580,7 +48144,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40602,7 +48167,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40613,7 +48178,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40636,7 +48202,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40647,7 +48213,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -40670,7 +48237,7 @@ "cost": { "input": 2.6, "output": 13, - "cache_read": 0.25, + "cache_read": 0.26, "cache_write": 3.2 } }, @@ -40700,6 +48267,33 @@ "release_date": "2024-08-15", "last_updated": "2024-08-15" }, + { + "id": "novita/kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-07" + }, { "id": "novita/glm-4.6", "name": "GLM-4.6", @@ -42730,6 +50324,32 @@ "attachment": true, "open_weights": false }, + { + "id": "openai/gpt-5.2", + "name": "OpenAI: gpt-5.2", + "display_name": "OpenAI: gpt-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false + }, { "id": "openai/gpt-5.1-chat", "name": "OpenAI: gpt-5.1", @@ -45846,6 +53466,324 @@ }, "type": "chat" }, + { + "id": "mistral-large-3:675b-cloud", + "name": "Mistral Large 3 675B Cloud", + "display_name": "Mistral Large 3 675B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:latest", + "name": "Ministral 3 Latest", + "display_name": "Ministral 3 Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b", + "name": "Ministral 3 3B", + "display_name": "Ministral 3 3B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b", + "name": "Ministral 3 14B", + "display_name": "Ministral 3 14B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b-cloud", + "name": "Ministral 3 3B Cloud", + "display_name": "Ministral 3 3B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b-cloud", + "name": "Ministral 3 8B Cloud", + "display_name": "Ministral 3 8B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b-cloud", + "name": "Ministral 3 14B Cloud", + "display_name": "Ministral 3 14B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b-instruct-2512-q8_0", + "name": "Ministral 3 3B Instruct 2512 Q8_0", + "display_name": "Ministral 3 3B Instruct 2512 Q8_0", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b-instruct-2512-fp16", + "name": "Ministral 3 3B Instruct 2512 FP16", + "display_name": "Ministral 3 3B Instruct 2512 FP16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b-instruct-2512-q8_0", + "name": "Ministral 3 8B Instruct 2512 Q8_0", + "display_name": "Ministral 3 8B Instruct 2512 Q8_0", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b-instruct-2512-fp16", + "name": "Ministral 3 8B Instruct 2512 FP16", + "display_name": "Ministral 3 8B Instruct 2512 FP16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b-instruct-2512-q8_0", + "name": "Ministral 3 14B Instruct 2512 Q8_0", + "display_name": "Ministral 3 14B Instruct 2512 Q8_0", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b-instruct-2512-fp16", + "name": "Ministral 3 14B Instruct 2512 FP16", + "display_name": "Ministral 3 14B Instruct 2512 FP16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "qwen2.5:latest", "name": "Qwen2.5 Latest", @@ -47046,6 +54984,20 @@ "name": "PPInfra", "display_name": "PPInfra", "models": [ + { + "id": "zai-org/autoglm-phone-9b-multilingual", + "name": "AutoGLM-Phone-9B-Multilingual", + "display_name": "AutoGLM-Phone-9B-Multilingual", + "limit": { + "context": 65536, + "output": 32000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "baichuan/baichuan-m2-32b", "name": "BaiChuan M2 32B", @@ -47192,6 +55144,21 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v3.2", + "name": "Deepseek V3.2", + "display_name": "Deepseek V3.2", + "limit": { + "context": 163840, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "deepseek/deepseek-v3.2-exp", "name": "Deepseek V3.2 Exp", @@ -47369,6 +55336,21 @@ }, "type": "chat" }, + { + "id": "zai-org/glm-4.6v", + "name": "GLM 4.6v", + "display_name": "GLM 4.6v", + "limit": { + "context": 131072, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "zai-org/glm-4.5", "name": "GLM-4.5", @@ -47921,6 +55903,20 @@ }, "type": "chat" }, + { + "id": "amazon/nova-2-lite-v1", + "name": "Amazon: Nova 2 Lite", + "display_name": "Amazon: Nova 2 Lite", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "amazon/nova-lite-v1", "name": "Amazon: Nova Lite 1.0", @@ -48201,6 +56197,20 @@ }, "type": "chat" }, + { + "id": "arcee-ai/trinity-mini", + "name": "Arcee AI: Trinity Mini", + "display_name": "Arcee AI: Trinity Mini", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "arcee-ai/virtuoso-large", "name": "Arcee AI: Virtuoso Large", @@ -48314,9 +56324,9 @@ "type": "chat" }, { - "id": "openrouter/bert-nebulon-alpha", - "name": "Bert-Nebulon Alpha", - "display_name": "Bert-Nebulon Alpha", + "id": "openrouter/bodybuilder", + "name": "Body Builder", + "display_name": "Body Builder", "limit": { "context": 4096, "output": 4096 @@ -48509,20 +56519,6 @@ }, "type": "chat" }, - { - "id": "deepcogito/cogito-v2-preview-deepseek-671b", - "name": "Deep Cogito: Cogito V2 Preview Deepseek 671B", - "display_name": "Deep Cogito: Cogito V2 Preview Deepseek 671B", - "limit": { - "context": 4096, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "deepcogito/cogito-v2-preview-llama-405b", "name": "Deep Cogito: Cogito V2 Preview Llama 405B", @@ -48663,6 +56659,20 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek: DeepSeek V3.2", + "display_name": "DeepSeek: DeepSeek V3.2", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "deepseek/deepseek-v3.2-exp", "name": "DeepSeek: DeepSeek V3.2 Exp", @@ -48677,6 +56687,20 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek: DeepSeek V3.2 Speciale", + "display_name": "DeepSeek: DeepSeek V3.2 Speciale", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "deepseek/deepseek-r1", "name": "DeepSeek: R1", @@ -48761,6 +56785,20 @@ }, "type": "chat" }, + { + "id": "essentialai/rnj-1-instruct", + "name": "EssentialAI: Rnj 1 Instruct", + "display_name": "EssentialAI: Rnj 1 Instruct", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "alpindale/goliath-120b", "name": "Goliath 120B", @@ -49587,20 +57625,6 @@ }, "type": "chat" }, - { - "id": "mistralai/mistral-small", - "name": "Mistral Small", - "display_name": "Mistral Small", - "limit": { - "context": 4096, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "mistralai/mistral-tiny", "name": "Mistral Tiny", @@ -49616,9 +57640,9 @@ "type": "chat" }, { - "id": "mistralai/codestral-2501", - "name": "Mistral: Codestral 2501", - "display_name": "Mistral: Codestral 2501", + "id": "mistralai/codestral-2508", + "name": "Mistral: Codestral 2508", + "display_name": "Mistral: Codestral 2508", "limit": { "context": 4096, "output": 4096 @@ -49630,9 +57654,9 @@ "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Mistral: Codestral 2508", - "display_name": "Mistral: Codestral 2508", + "id": "mistralai/devstral-2512", + "name": "Mistral: Devstral 2 2512", + "display_name": "Mistral: Devstral 2 2512", "limit": { "context": 4096, "output": 4096 @@ -49686,9 +57710,9 @@ "type": "chat" }, { - "id": "mistralai/magistral-medium-2506", - "name": "Mistral: Magistral Medium 2506", - "display_name": "Mistral: Magistral Medium 2506", + "id": "mistralai/ministral-14b-2512", + "name": "Mistral: Ministral 3 14B 2512", + "display_name": "Mistral: Ministral 3 14B 2512", "limit": { "context": 4096, "output": 4096 @@ -49700,9 +57724,9 @@ "type": "chat" }, { - "id": "mistralai/magistral-medium-2506:thinking", - "name": "Mistral: Magistral Medium 2506 (thinking)", - "display_name": "Mistral: Magistral Medium 2506 (thinking)", + "id": "mistralai/ministral-3b-2512", + "name": "Mistral: Ministral 3 3B 2512", + "display_name": "Mistral: Ministral 3 3B 2512", "limit": { "context": 4096, "output": 4096 @@ -49714,9 +57738,9 @@ "type": "chat" }, { - "id": "mistralai/magistral-small-2506", - "name": "Mistral: Magistral Small 2506", - "display_name": "Mistral: Magistral Small 2506", + "id": "mistralai/ministral-8b-2512", + "name": "Mistral: Ministral 3 8B 2512", + "display_name": "Mistral: Ministral 3 8B 2512", "limit": { "context": 4096, "output": 4096 @@ -49811,6 +57835,20 @@ }, "type": "chat" }, + { + "id": "mistralai/mistral-large-2512", + "name": "Mistral: Mistral Large 3 2512", + "display_name": "Mistral: Mistral Large 3 2512", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "mistralai/mistral-medium-3", "name": "Mistral: Mistral Medium 3", @@ -50777,6 +58815,20 @@ }, "type": "chat" }, + { + "id": "openai/gpt-5.1-codex-max", + "name": "OpenAI: GPT-5.1-Codex-Max", + "display_name": "OpenAI: GPT-5.1-Codex-Max", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "openai/gpt-5.1-codex-mini", "name": "OpenAI: GPT-5.1-Codex-Mini", @@ -50791,6 +58843,48 @@ }, "type": "chat" }, + { + "id": "openai/gpt-5.2", + "name": "OpenAI: GPT-5.2", + "display_name": "OpenAI: GPT-5.2", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.2-chat", + "name": "OpenAI: GPT-5.2 Chat", + "display_name": "OpenAI: GPT-5.2 Chat", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.2-pro", + "name": "OpenAI: GPT-5.2 Pro", + "display_name": "OpenAI: GPT-5.2 Pro", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "openai/gpt-oss-120b", "name": "OpenAI: gpt-oss-120b", @@ -50861,20 +58955,6 @@ }, "type": "chat" }, - { - "id": "openai/o1-mini", - "name": "OpenAI: o1-mini", - "display_name": "OpenAI: o1-mini", - "limit": { - "context": 4096, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "openai/o1-pro", "name": "OpenAI: o1-pro", @@ -51099,6 +59179,20 @@ }, "type": "chat" }, + { + "id": "prime-intellect/intellect-3", + "name": "Prime Intellect: INTELLECT-3", + "display_name": "Prime Intellect: INTELLECT-3", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "qwen/qwen-plus-2025-07-28", "name": "Qwen: Qwen Plus 0728", @@ -51435,20 +59529,6 @@ }, "type": "chat" }, - { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen: Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen: Qwen3 Coder 480B A35B Instruct", - "limit": { - "context": 4096, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "qwen/qwen3-coder-flash", "name": "Qwen: Qwen3 Coder Flash", @@ -51618,23 +59698,9 @@ "type": "chat" }, { - "id": "qwen/text-embedding-v3", - "name": "Qwen: Text Embedding v3", - "display_name": "Qwen: Text Embedding v3", - "limit": { - "context": 4096, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "embedding" - }, - { - "id": "qwen/text-embedding-v4", - "name": "Qwen: Text Embedding v4", - "display_name": "Qwen: Text Embedding v4", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "limit": { "context": 4096, "output": 4096 @@ -51643,12 +59709,12 @@ "reasoning": { "supported": false }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "qwen/qwen-2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "limit": { "context": 4096, "output": 4096 @@ -51660,9 +59726,9 @@ "type": "chat" }, { - "id": "qwen/qwen-2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "relace/relace-apply-3", + "name": "Relace: Relace Apply 3", + "display_name": "Relace: Relace Apply 3", "limit": { "context": 4096, "output": 4096 @@ -51674,9 +59740,9 @@ "type": "chat" }, { - "id": "relace/relace-apply-3", - "name": "Relace: Relace Apply 3", - "display_name": "Relace: Relace Apply 3", + "id": "relace/relace-search", + "name": "Relace: Relace Search", + "display_name": "Relace: Relace Search", "limit": { "context": 4096, "output": 4096 @@ -51939,6 +60005,20 @@ }, "type": "chat" }, + { + "id": "tngtech/tng-r1t-chimera", + "name": "TNG: R1T Chimera", + "display_name": "TNG: R1T Chimera", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "alibaba/tongyi-deepresearch-30b-a3b", "name": "Tongyi DeepResearch 30B A3B", @@ -52162,6 +60242,20 @@ "supported": false }, "type": "chat" + }, + { + "id": "z-ai/glm-4.6v", + "name": "Z.AI: GLM 4.6V", + "display_name": "Z.AI: GLM 4.6V", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" } ] }, @@ -52221,6 +60315,57 @@ }, "type": "imageGeneration" }, + { + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 400000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, { "id": "gemini-3-pro-preview", "name": "gemini-3-pro-preview", @@ -52249,6 +60394,32 @@ }, "type": "chat" }, + { + "id": "gpt-5.2-pro", + "name": "gpt-5.2-pro", + "display_name": "gpt-5.2-pro", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 400000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 21, + "output": 168, + "cache_read": 2.1 + }, + "type": "chat" + }, { "id": "gpt-5.1", "name": "gpt-5.1", @@ -52275,6 +60446,32 @@ }, "type": "chat" }, + { + "id": "gpt-5.1-codex-max", + "name": "gpt-5.1-codex-max", + "display_name": "gpt-5.1-codex-max", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 400000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, { "id": "gemini-3-pro-preview-search", "name": "gemini-3-pro-preview-search", @@ -52380,6 +60577,30 @@ }, "type": "chat" }, + { + "id": "mistral-large-3", + "name": "mistral-large-3", + "display_name": "mistral-large-3", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.5, + "output": 1.5 + }, + "type": "chat" + }, { "id": "claude-haiku-4-5", "name": "claude-haiku-4-5", @@ -52482,6 +60703,84 @@ }, "type": "chat" }, + { + "id": "glm-4.6v", + "name": "glm-4.6v", + "display_name": "glm-4.6v", + "modalities": { + "input": [ + "text", + "image", + "video" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.137, + "output": 0.411, + "cache_read": 0.0274 + }, + "type": "chat" + }, + { + "id": "grok-4-1-fast-non-reasoning", + "name": "grok-4-1-fast-non-reasoning", + "display_name": "grok-4-1-fast-non-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "grok-4-1-fast-reasoning", + "name": "grok-4-1-fast-reasoning", + "display_name": "grok-4-1-fast-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, { "id": "gpt-5", "name": "gpt-5", @@ -52508,6 +60807,128 @@ }, "type": "chat" }, + { + "id": "deepseek-v3.2-fast", + "name": "deepseek-v3.2-fast", + "display_name": "deepseek-v3.2-fast", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 1.096, + "output": 3.288, + "cache_read": 1.096 + }, + "type": "chat" + }, + { + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.302, + "output": 0.453, + "cache_read": 0.0302 + }, + "type": "chat" + }, + { + "id": "deepseek-v3.2-speciale", + "name": "deepseek-v3.2-speciale", + "display_name": "deepseek-v3.2-speciale", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 0.302, + "output": 0.453, + "cache_read": 0.0302 + }, + "type": "chat" + }, + { + "id": "deepseek-v3.2-think", + "name": "deepseek-v3.2-think", + "display_name": "deepseek-v3.2-think", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.302, + "output": 0.453, + "cache_read": 0.0302 + }, + "type": "chat" + }, + { + "id": "deepseek-math-v2", + "name": "deepseek-math-v2", + "display_name": "deepseek-math-v2", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 163000, + "output": 163000 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 0.492, + "output": 1.968, + "cache_read": 0.0984 + }, + "type": "chat" + }, { "id": "gpt-5-codex", "name": "gpt-5-codex", @@ -52662,9 +61083,15 @@ "type": "chat" }, { - "id": "sora-2-pro", - "name": "sora-2-pro", - "display_name": "sora-2-pro", + "id": "doubao-seedream-4-5", + "name": "doubao-seedream-4-5", + "display_name": "doubao-seedream-4-5", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -52675,9 +61102,10 @@ }, "cost": { "input": 2, - "output": 2 + "output": 0, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { "id": "sora-2", @@ -52697,6 +61125,24 @@ }, "type": "chat" }, + { + "id": "sora-2-pro", + "name": "sora-2-pro", + "display_name": "sora-2-pro", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2, + "output": 2 + }, + "type": "chat" + }, { "id": "gpt-4o-audio-preview", "name": "gpt-4o-audio-preview", @@ -52924,12 +61370,13 @@ "type": "chat" }, { - "id": "wan2.5-t2v-preview", - "name": "wan2.5-t2v-preview", - "display_name": "wan2.5-t2v-preview", + "id": "wan2.2-i2v-plus", + "name": "wan2.2-i2v-plus", + "display_name": "wan2.2-i2v-plus", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -52947,9 +61394,14 @@ "type": "chat" }, { - "id": "web-sora-2-pro", - "name": "web-sora-2-pro", - "display_name": "web-sora-2-pro", + "id": "wan2.2-t2v-plus", + "name": "wan2.2-t2v-plus", + "display_name": "wan2.2-t2v-plus", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -52960,14 +61412,20 @@ }, "cost": { "input": 2, - "output": 2 + "output": 0 }, "type": "chat" }, { - "id": "web-sora-2", - "name": "web-sora-2", - "display_name": "web-sora-2", + "id": "wan2.5-i2v-preview", + "name": "wan2.5-i2v-preview", + "display_name": "wan2.5-i2v-preview", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -52978,18 +61436,17 @@ }, "cost": { "input": 2, - "output": 2 + "output": 0 }, "type": "chat" }, { - "id": "wan2.5-i2v-preview", - "name": "wan2.5-i2v-preview", - "display_name": "wan2.5-i2v-preview", + "id": "wan2.5-t2v-preview", + "name": "wan2.5-t2v-preview", + "display_name": "wan2.5-t2v-preview", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { @@ -53007,14 +61464,9 @@ "type": "chat" }, { - "id": "wan2.2-t2v-plus", - "name": "wan2.2-t2v-plus", - "display_name": "wan2.2-t2v-plus", - "modalities": { - "input": [ - "text" - ] - }, + "id": "web-sora-2", + "name": "web-sora-2", + "display_name": "web-sora-2", "limit": { "context": 8192, "output": 8192 @@ -53025,20 +61477,14 @@ }, "cost": { "input": 2, - "output": 0 + "output": 2 }, "type": "chat" }, { - "id": "wan2.2-i2v-plus", - "name": "wan2.2-i2v-plus", - "display_name": "wan2.2-i2v-plus", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "web-sora-2-pro", + "name": "web-sora-2-pro", + "display_name": "web-sora-2-pro", "limit": { "context": 8192, "output": 8192 @@ -53049,7 +61495,7 @@ }, "cost": { "input": 2, - "output": 0 + "output": 2 }, "type": "chat" }, @@ -53301,6 +61747,56 @@ }, "type": "chat" }, + { + "id": "claude-opus-4-0", + "name": "claude-opus-4-0", + "display_name": "claude-opus-4-0", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 200000, + "output": 200000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 16.5, + "output": 82.5 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-0", + "name": "claude-sonnet-4-0", + "display_name": "claude-sonnet-4-0", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 1000000, + "output": 1000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 3.3, + "output": 16.5, + "cache_read": 0.33 + }, + "type": "chat" + }, { "id": "gemini-2.5-flash", "name": "gemini-2.5-flash", @@ -53435,50 +61931,6 @@ }, "type": "chat" }, - { - "id": "grok-code-fast-1", - "name": "grok-code-fast-1", - "display_name": "grok-code-fast-1", - "limit": { - "context": 256000, - "output": 256000 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 - }, - "type": "chat" - }, - { - "id": "kimi-for-coding", - "name": "kimi-for-coding", - "display_name": "kimi-for-coding", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 - }, - "type": "chat" - }, { "id": "gemini-2.5-flash-nothink", "name": "gemini-2.5-flash-nothink", @@ -53851,6 +62303,31 @@ }, "type": "chat" }, + { + "id": "gemini-2.5-flash-image-preview", + "name": "gemini-2.5-flash-image-preview", + "display_name": "gemini-2.5-flash-image-preview", + "modalities": { + "input": [ + "image", + "text" + ] + }, + "limit": { + "context": 32800, + "output": 32800 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.3 + }, + "type": "imageGeneration" + }, { "id": "glm-4.5", "name": "glm-4.5", @@ -54004,9 +62481,9 @@ "type": "chat" }, { - "id": "veo-3.0-generate-preview", - "name": "veo-3.0-generate-preview", - "display_name": "veo-3.0-generate-preview", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "qwen3-vl-235b-a22b-instruct", + "display_name": "qwen3-vl-235b-a22b-instruct", "modalities": { "input": [ "text", @@ -54015,24 +62492,23 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 131000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.274, + "output": 1.096 }, "type": "chat" }, { - "id": "veo-3.1-fast-generate-preview", - "name": "veo-3.1-fast-generate-preview", - "display_name": "veo-3.1-fast-generate-preview", + "id": "qwen3-vl-235b-a22b-thinking", + "name": "qwen3-vl-235b-a22b-thinking", + "display_name": "qwen3-vl-235b-a22b-thinking", "modalities": { "input": [ "text", @@ -54041,23 +62517,24 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 131000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0 + "input": 0.274, + "output": 2.74 }, "type": "chat" }, { - "id": "veo-3.1-generate-preview", - "name": "veo-3.1-generate-preview", - "display_name": "veo-3.1-generate-preview", + "id": "qwen3-vl-30b-a3b-instruct", + "name": "qwen3-vl-30b-a3b-instruct", + "display_name": "qwen3-vl-30b-a3b-instruct", "modalities": { "input": [ "text", @@ -54066,17 +62543,16 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.1028, + "output": 0.4112 }, "type": "chat" }, @@ -54107,9 +62583,9 @@ "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-instruct", - "name": "qwen3-vl-30b-a3b-instruct", - "display_name": "qwen3-vl-30b-a3b-instruct", + "id": "veo-3.0-generate-preview", + "name": "veo-3.0-generate-preview", + "display_name": "veo-3.0-generate-preview", "modalities": { "input": [ "text", @@ -54118,23 +62594,24 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.1028, - "output": 0.4112 + "input": 2, + "output": 2, + "cache_read": 0 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "qwen3-vl-235b-a22b-thinking", - "display_name": "qwen3-vl-235b-a22b-thinking", + "id": "veo-3.1-fast-generate-preview", + "name": "veo-3.1-fast-generate-preview", + "display_name": "veo-3.1-fast-generate-preview", "modalities": { "input": [ "text", @@ -54143,24 +62620,23 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.274, - "output": 2.74 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "qwen3-vl-235b-a22b-instruct", - "display_name": "qwen3-vl-235b-a22b-instruct", + "id": "veo-3.1-generate-preview", + "name": "veo-3.1-generate-preview", + "display_name": "veo-3.1-generate-preview", "modalities": { "input": [ "text", @@ -54169,16 +62645,17 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.274, - "output": 1.096 + "input": 2, + "output": 2, + "cache_read": 0 }, "type": "chat" }, @@ -54201,31 +62678,6 @@ }, "type": "chat" }, - { - "id": "gemini-2.5-flash-image-preview", - "name": "gemini-2.5-flash-image-preview", - "display_name": "gemini-2.5-flash-image-preview", - "modalities": { - "input": [ - "image", - "text" - ] - }, - "limit": { - "context": 32800, - "output": 32800 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.3 - }, - "type": "imageGeneration" - }, { "id": "aihubmix-router", "name": "aihubmix-router", @@ -55141,13 +63593,12 @@ "type": "chat" }, { - "id": "qwen3-reranker-4b", - "name": "qwen3-reranker-4b", - "display_name": "qwen3-reranker-4b", + "id": "qwen3-embedding-0.6b", + "name": "qwen3-embedding-0.6b", + "display_name": "qwen3-embedding-0.6b", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { @@ -55159,34 +63610,33 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.068, + "output": 0.068 }, - "type": "rerank" + "type": "embedding" }, { - "id": "qwen3-reranker-0.6b", - "name": "qwen3-reranker-0.6b", - "display_name": "qwen3-reranker-0.6b", + "id": "qwen3-embedding-4b", + "name": "qwen3-embedding-4b", + "display_name": "qwen3-embedding-4b", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.068, + "output": 0.068 }, - "type": "rerank" + "type": "embedding" }, { "id": "qwen3-embedding-8b", @@ -55212,35 +63662,37 @@ "type": "embedding" }, { - "id": "qwen3-embedding-4b", - "name": "qwen3-embedding-4b", - "display_name": "qwen3-embedding-4b", + "id": "qwen3-reranker-0.6b", + "name": "qwen3-reranker-0.6b", + "display_name": "qwen3-reranker-0.6b", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 16000, + "output": 16000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.068, - "output": 0.068 + "input": 0.11, + "output": 0.11 }, - "type": "embedding" + "type": "rerank" }, { - "id": "qwen3-embedding-0.6b", - "name": "qwen3-embedding-0.6b", - "display_name": "qwen3-embedding-0.6b", + "id": "qwen3-reranker-4b", + "name": "qwen3-reranker-4b", + "display_name": "qwen3-reranker-4b", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -55252,10 +63704,10 @@ "supported": false }, "cost": { - "input": 0.068, - "output": 0.068 + "input": 0.11, + "output": 0.11 }, - "type": "embedding" + "type": "rerank" }, { "id": "qwen3-reranker-8b", @@ -55995,6 +64447,34 @@ }, "type": "chat" }, + { + "id": "gemini-2.5-pro-preview-06-05", + "name": "gemini-2.5-pro-preview-06-05", + "display_name": "gemini-2.5-pro-preview-06-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, + "limit": { + "context": 1048576, + "output": 1048576 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + }, + "type": "chat" + }, { "id": "embedding-2", "name": "embedding-2", @@ -56068,34 +64548,6 @@ }, "type": "chat" }, - { - "id": "gemini-2.5-pro-preview-06-05", - "name": "gemini-2.5-pro-preview-06-05", - "display_name": "gemini-2.5-pro-preview-06-05", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, - "limit": { - "context": 1048576, - "output": 1048576 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" - }, { "id": "o1", "name": "o1", @@ -56532,54 +64984,54 @@ "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - "name": "gpt-4o-2024-11-20", - "display_name": "gpt-4o-2024-11-20", + "id": "gemini-2.0-flash-thinking-exp-01-21", + "name": "gemini-2.0-flash-thinking-exp-01-21", + "display_name": "gemini-2.0-flash-thinking-exp-01-21", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.076, + "output": 0.304 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-01-21", - "name": "gemini-2.0-flash-thinking-exp-01-21", - "display_name": "gemini-2.0-flash-thinking-exp-01-21", + "id": "gpt-4o-2024-11-20", + "name": "gpt-4o-2024-11-20", + "display_name": "gpt-4o-2024-11-20", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.076, - "output": 0.304 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, @@ -56683,24 +65135,6 @@ }, "type": "chat" }, - { - "id": "ernie-x1.1-preview", - "name": "ernie-x1.1-preview", - "display_name": "ernie-x1.1-preview", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.136, - "output": 0.544 - }, - "type": "chat" - }, { "id": "minimax-m2", "name": "minimax-m2", @@ -56725,69 +65159,9 @@ "type": "chat" }, { - "id": "kat-dev", - "name": "kat-dev", - "display_name": "kat-dev", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.137, - "output": 0.548 - }, - "type": "chat" - }, - { - "id": "llama-3.3-70b", - "name": "llama-3.3-70b", - "display_name": "llama-3.3-70b", - "limit": { - "context": 65536, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.6, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "o1-global", - "name": "o1-global", - "display_name": "o1-global", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" - }, - { - "id": "qianfan-qi-vl", - "name": "qianfan-qi-vl", - "display_name": "qianfan-qi-vl", + "id": "ernie-x1.1-preview", + "name": "ernie-x1.1-preview", + "display_name": "ernie-x1.1-preview", "limit": { "context": 8192, "output": 8192 @@ -56797,8 +65171,8 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, @@ -56850,56 +65224,6 @@ }, "type": "embedding" }, - { - "id": "claude-opus-4-0", - "name": "claude-opus-4-0", - "display_name": "claude-opus-4-0", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 200000, - "output": 200000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 16.5, - "output": 82.5 - }, - "type": "chat" - }, - { - "id": "claude-sonnet-4-0", - "name": "claude-sonnet-4-0", - "display_name": "claude-sonnet-4-0", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 1000000, - "output": 1000000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33 - }, - "type": "chat" - }, { "id": "codestral-latest", "name": "codestral-latest", @@ -57015,9 +65339,50 @@ "type": "chat" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "unsloth/gemma-3-27b-it", - "display_name": "unsloth/gemma-3-27b-it", + "id": "kat-dev", + "name": "kat-dev", + "display_name": "kat-dev", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.137, + "output": 0.548 + }, + "type": "chat" + }, + { + "id": "llama-3.3-70b", + "name": "llama-3.3-70b", + "display_name": "llama-3.3-70b", + "limit": { + "context": 65536, + "output": 65536 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.6, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "o1-global", + "name": "o1-global", + "display_name": "o1-global", "limit": { "context": 8192, "output": 8192 @@ -57027,9 +65392,27 @@ "supported": false }, "cost": { - "input": 0.22, - "output": 0.22, - "cache_read": 0 + "input": 15, + "output": 60, + "cache_read": 7.5 + }, + "type": "chat" + }, + { + "id": "qianfan-qi-vl", + "name": "qianfan-qi-vl", + "display_name": "qianfan-qi-vl", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.6 }, "type": "chat" }, @@ -57057,6 +65440,43 @@ }, "type": "chat" }, + { + "id": "unsloth/gemma-3-27b-it", + "name": "unsloth/gemma-3-27b-it", + "display_name": "unsloth/gemma-3-27b-it", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.22, + "output": 0.22, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "qwen-qwq-32b", + "name": "qwen-qwq-32b", + "display_name": "qwen-qwq-32b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.4, + "output": 0.8 + }, + "type": "chat" + }, { "id": "unsloth/gemma-3-12b-it", "name": "unsloth/gemma-3-12b-it", @@ -57118,24 +65538,6 @@ }, "type": "chat" }, - { - "id": "qwen-qwq-32b", - "name": "qwen-qwq-32b", - "display_name": "qwen-qwq-32b", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 0.8 - }, - "type": "chat" - }, { "id": "qwen-max-0125", "name": "qwen-max-0125", @@ -57722,9 +66124,9 @@ "type": "chat" }, { - "id": "grok-3-mini-fast-beta", - "name": "grok-3-mini-fast-beta", - "display_name": "grok-3-mini-fast-beta", + "id": "qwen-turbo-2025-04-28", + "name": "qwen-turbo-2025-04-28", + "display_name": "qwen-turbo-2025-04-28", "limit": { "context": 8192, "output": 8192 @@ -57734,15 +66136,16 @@ "supported": false }, "cost": { - "input": 0.33, - "output": 2.20011 + "input": 0.046, + "output": 0.92, + "cache_read": 0 }, "type": "chat" }, { - "id": "qwen-3-32b", - "name": "qwen-3-32b", - "display_name": "qwen-3-32b", + "id": "grok-3-mini-fast-beta", + "name": "grok-3-mini-fast-beta", + "display_name": "grok-3-mini-fast-beta", "limit": { "context": 8192, "output": 8192 @@ -57752,15 +66155,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.33, + "output": 2.20011 }, "type": "chat" }, { - "id": "qwen-turbo-2025-04-28", - "name": "qwen-turbo-2025-04-28", - "display_name": "qwen-turbo-2025-04-28", + "id": "qwen-3-32b", + "name": "qwen-3-32b", + "display_name": "qwen-3-32b", "limit": { "context": 8192, "output": 8192 @@ -57770,9 +66173,8 @@ "supported": false }, "cost": { - "input": 0.046, - "output": 0.92, - "cache_read": 0 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, @@ -57927,29 +66329,6 @@ }, "type": "chat" }, - { - "id": "coding-glm-4.5-air", - "name": "coding-glm-4.5-air", - "display_name": "coding-glm-4.5-air", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.014, - "output": 0.084 - }, - "type": "chat" - }, { "id": "glm-4.5-air", "name": "glm-4.5-air", @@ -58010,6 +66389,29 @@ }, "type": "chat" }, + { + "id": "coding-glm-4.5-air", + "name": "coding-glm-4.5-air", + "display_name": "coding-glm-4.5-air", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.014, + "output": 0.084 + }, + "type": "chat" + }, { "id": "llama-3.1-sonar-huge-128k-online", "name": "llama-3.1-sonar-huge-128k-online", @@ -58064,6 +66466,24 @@ }, "type": "chat" }, + { + "id": "gemini-2.0-flash-thinking-exp", + "name": "gemini-2.0-flash-thinking-exp", + "display_name": "gemini-2.0-flash-thinking-exp", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.076, + "output": 0.304 + }, + "type": "chat" + }, { "id": "glm-4.5-flash", "name": "glm-4.5-flash", @@ -58082,8 +66502,9 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, @@ -58378,24 +66799,6 @@ }, "type": "chat" }, - { - "id": "gemini-2.0-flash-thinking-exp", - "name": "gemini-2.0-flash-thinking-exp", - "display_name": "gemini-2.0-flash-thinking-exp", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.076, - "output": 0.304 - }, - "type": "chat" - }, { "id": "aihubmix-command-r-08-2024", "name": "aihubmix-command-r-08-2024", @@ -58465,6 +66868,53 @@ }, "type": "chat" }, + { + "id": "baidu-deepseek-v3.2", + "name": "baidu-deepseek-v3.2", + "display_name": "baidu-deepseek-v3.2", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.274, + "output": 0.411 + }, + "type": "chat" + }, + { + "id": "baidu-deepseek-v3.2-exp", + "name": "baidu-deepseek-v3.2-exp", + "display_name": "baidu-deepseek-v3.2-exp", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.274, + "output": 0.411, + "cache_read": 0.0274 + }, + "type": "chat" + }, { "id": "chatglm_lite", "name": "chatglm_lite", @@ -60931,6 +69381,278 @@ }, "type": "chat" }, + { + "id": "qwen2.5-math-72b-instruct", + "name": "qwen2.5-math-72b-instruct", + "display_name": "qwen2.5-math-72b-instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.8, + "output": 2.4 + }, + "type": "chat" + }, + { + "id": "qwen2.5-math-7b-instruct", + "name": "qwen2.5-math-7b-instruct", + "display_name": "qwen2.5-math-7b-instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "sonar-reasoning-pro", + "name": "sonar-reasoning-pro", + "display_name": "sonar-reasoning-pro", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 3, + "output": 12 + }, + "type": "chat" + }, + { + "id": "step-2-16k", + "name": "step-2-16k", + "display_name": "step-2-16k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2, + "output": 2 + }, + "type": "chat" + }, + { + "id": "text-ada-001", + "name": "text-ada-001", + "display_name": "text-ada-001", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.4, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "text-babbage-001", + "name": "text-babbage-001", + "display_name": "text-babbage-001", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.5, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "text-curie-001", + "name": "text-curie-001", + "display_name": "text-curie-001", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2, + "output": 2 + }, + "type": "chat" + }, + { + "id": "text-davinci-002", + "name": "text-davinci-002", + "display_name": "text-davinci-002", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 20, + "output": 20 + }, + "type": "chat" + }, + { + "id": "text-davinci-003", + "name": "text-davinci-003", + "display_name": "text-davinci-003", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 20, + "output": 20 + }, + "type": "chat" + }, + { + "id": "text-davinci-edit-001", + "name": "text-davinci-edit-001", + "display_name": "text-davinci-edit-001", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 20, + "output": 20 + }, + "type": "chat" + }, + { + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.13, + "output": 0.13 + }, + "type": "embedding" + }, + { + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.02, + "output": 0.02 + }, + "type": "embedding" + }, + { + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "embedding" + }, + { + "id": "text-embedding-v1", + "name": "text-embedding-v1", + "display_name": "text-embedding-v1", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "embedding" + }, { "id": "text-moderation-007", "name": "text-moderation-007", @@ -61003,29 +69725,6 @@ }, "type": "chat" }, - { - "id": "text-embedding-v1", - "name": "text-embedding-v1", - "display_name": "text-embedding-v1", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "embedding" - }, { "id": "tts-1", "name": "tts-1", @@ -61114,75 +69813,6 @@ "output": 30 } }, - { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "embedding" - }, - { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.02, - "output": 0.02 - }, - "type": "embedding" - }, - { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.13, - "output": 0.13 - }, - "type": "embedding" - }, { "id": "veo-3", "name": "veo-3", @@ -61210,60 +69840,6 @@ }, "type": "chat" }, - { - "id": "text-davinci-edit-001", - "name": "text-davinci-edit-001", - "display_name": "text-davinci-edit-001", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 20, - "output": 20 - }, - "type": "chat" - }, - { - "id": "text-davinci-003", - "name": "text-davinci-003", - "display_name": "text-davinci-003", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 20, - "output": 20 - }, - "type": "chat" - }, - { - "id": "text-davinci-002", - "name": "text-davinci-002", - "display_name": "text-davinci-002", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 20, - "output": 20 - }, - "type": "chat" - }, { "id": "veo3", "name": "veo3", @@ -61291,132 +69867,6 @@ }, "type": "chat" }, - { - "id": "text-curie-001", - "name": "text-curie-001", - "display_name": "text-curie-001", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2 - }, - "type": "chat" - }, - { - "id": "text-babbage-001", - "name": "text-babbage-001", - "display_name": "text-babbage-001", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.5, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "text-ada-001", - "name": "text-ada-001", - "display_name": "text-ada-001", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 0.4 - }, - "type": "chat" - }, - { - "id": "qwen2.5-math-72b-instruct", - "name": "qwen2.5-math-72b-instruct", - "display_name": "qwen2.5-math-72b-instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 2.4 - }, - "type": "chat" - }, - { - "id": "step-2-16k", - "name": "step-2-16k", - "display_name": "step-2-16k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2 - }, - "type": "chat" - }, - { - "id": "sonar-reasoning-pro", - "name": "sonar-reasoning-pro", - "display_name": "sonar-reasoning-pro", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 3, - "output": 12 - }, - "type": "chat" - }, - { - "id": "qwen2.5-math-7b-instruct", - "name": "qwen2.5-math-7b-instruct", - "display_name": "qwen2.5-math-7b-instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.4 - }, - "type": "chat" - }, { "id": "whisper-1", "name": "whisper-1", @@ -62062,9 +70512,9 @@ "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - "name": "AllenAI: Olmo 3 32B Think", - "display_name": "AllenAI: Olmo 3 32B Think", + "id": "allenai/olmo-3-32b-think:free", + "name": "AllenAI: Olmo 3 32B Think (free)", + "display_name": "AllenAI: Olmo 3 32B Think (free)", "modalities": { "input": [ "text" @@ -62154,6 +70604,58 @@ }, "type": "chat" }, + { + "id": "amazon/nova-2-lite-v1", + "name": "Amazon: Nova 2 Lite", + "display_name": "Amazon: Nova 2 Lite", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 65535 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "amazon/nova-2-lite-v1:free", + "name": "Amazon: Nova 2 Lite (free)", + "display_name": "Amazon: Nova 2 Lite (free)", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 65535 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, { "id": "amazon/nova-lite-v1", "name": "Amazon: Nova Lite 1.0", @@ -62523,7 +71025,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 32000 }, "tool_call": true, "reasoning": { @@ -62651,6 +71153,54 @@ }, "type": "imageGeneration" }, + { + "id": "arcee-ai/trinity-mini", + "name": "Arcee AI: Trinity Mini", + "display_name": "Arcee AI: Trinity Mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "arcee-ai/trinity-mini:free", + "name": "Arcee AI: Trinity Mini (free)", + "display_name": "Arcee AI: Trinity Mini (free)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "arcee-ai/virtuoso-large", "name": "Arcee AI: Virtuoso Large", @@ -62946,29 +71496,6 @@ }, "type": "chat" }, - { - "id": "deepcogito/cogito-v2-preview-deepseek-671b", - "name": "Deep Cogito: Cogito V2 Preview Deepseek 671B", - "display_name": "Deep Cogito: Cogito V2 Preview Deepseek 671B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 163840, - "output": 163840 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, { "id": "deepcogito/cogito-v2-preview-llama-109b-moe", "name": "Cogito V2 Preview Llama 109B", @@ -63120,8 +71647,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 7168 }, "tool_call": true, "reasoning": { @@ -63303,8 +71830,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 163840, + "output": 163840 }, "tool_call": true, "reasoning": { @@ -63326,8 +71853,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 163840, + "output": 163840 }, "tool_call": true, "reasoning": { @@ -63336,6 +71863,30 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek: DeepSeek V3.2", + "display_name": "DeepSeek: DeepSeek V3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 163840 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "deepseek/deepseek-v3.2-exp", "name": "DeepSeek: DeepSeek V3.2 Exp", @@ -63350,7 +71901,7 @@ }, "limit": { "context": 163840, - "output": 65536 + "output": 163840 }, "temperature": true, "tool_call": true, @@ -63360,6 +71911,30 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek: DeepSeek V3.2 Speciale", + "display_name": "DeepSeek: DeepSeek V3.2 Speciale", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 65536 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "eleutherai/llemma_7b", "name": "EleutherAI: Llemma 7b", @@ -63382,6 +71957,28 @@ }, "type": "chat" }, + { + "id": "essentialai/rnj-1-instruct", + "name": "EssentialAI: Rnj 1 Instruct", + "display_name": "EssentialAI: Rnj 1 Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "google/gemini-2.0-flash-001", "name": "Google: Gemini 2.0 Flash", @@ -63849,8 +72446,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 96000, + "output": 96000 }, "tool_call": true, "reasoning": { @@ -64517,7 +73114,7 @@ }, "limit": { "context": 131072, - "output": 120000 + "output": 16384 }, "tool_call": true, "reasoning": { @@ -64562,7 +73159,7 @@ }, "limit": { "context": 1048576, - "output": 8192 + "output": 16384 }, "tool_call": true, "reasoning": { @@ -64898,8 +73495,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -64910,9 +73507,9 @@ "type": "chat" }, { - "id": "mistralai/codestral-2501", - "name": "Mistral: Codestral 2501", - "display_name": "Mistral: Codestral 2501", + "id": "mistralai/codestral-2508", + "name": "Mistral: Codestral 2508", + "display_name": "Mistral: Codestral 2508", "modalities": { "input": [ "text" @@ -64933,9 +73530,9 @@ "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Mistral: Codestral 2508", - "display_name": "Mistral: Codestral 2508", + "id": "mistralai/devstral-2512", + "name": "Mistral: Devstral 2 2512", + "display_name": "Mistral: Devstral 2 2512", "modalities": { "input": [ "text" @@ -64945,8 +73542,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -64956,9 +73553,9 @@ "type": "chat" }, { - "id": "mistralai/devstral-medium", - "name": "Mistral: Devstral Medium", - "display_name": "Mistral: Devstral Medium", + "id": "mistralai/devstral-2512:free", + "name": "Mistral: Devstral 2 2512 (free)", + "display_name": "Mistral: Devstral 2 2512 (free)", "modalities": { "input": [ "text" @@ -64968,8 +73565,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -64979,9 +73576,9 @@ "type": "chat" }, { - "id": "mistralai/devstral-small", - "name": "Mistral: Devstral Small 1.1", - "display_name": "Mistral: Devstral Small 1.1", + "id": "mistralai/devstral-medium", + "name": "Mistral: Devstral Medium", + "display_name": "Mistral: Devstral Medium", "modalities": { "input": [ "text" @@ -64991,8 +73588,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -65002,9 +73599,9 @@ "type": "chat" }, { - "id": "mistralai/devstral-small-2505", - "name": "Mistral: Devstral Small 2505", - "display_name": "Mistral: Devstral Small 2505", + "id": "mistralai/devstral-small", + "name": "Mistral: Devstral Small 1.1", + "display_name": "Mistral: Devstral Small 1.1", "modalities": { "input": [ "text" @@ -65025,9 +73622,9 @@ "type": "chat" }, { - "id": "mistralai/magistral-medium-2506", - "name": "Mistral: Magistral Medium 2506", - "display_name": "Mistral: Magistral Medium 2506", + "id": "mistralai/devstral-small-2505", + "name": "Mistral: Devstral Small 2505", + "display_name": "Mistral: Devstral Small 2505", "modalities": { "input": [ "text" @@ -65037,45 +73634,44 @@ ] }, "limit": { - "context": 40960, - "output": 40000 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "mistralai/magistral-medium-2506:thinking", - "name": "Mistral: Magistral Medium 2506 (thinking)", - "display_name": "Mistral: Magistral Medium 2506 (thinking)", + "id": "mistralai/ministral-14b-2512", + "name": "Mistral: Ministral 3 14B 2512", + "display_name": "Mistral: Ministral 3 14B 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/magistral-small-2506", - "name": "Mistral: Magistral Small 2506", - "display_name": "Mistral: Magistral Small 2506", + "id": "mistralai/ministral-3b", + "name": "Mistral: Ministral 3B", + "display_name": "Mistral: Ministral 3B", "modalities": { "input": [ "text" @@ -65085,24 +73681,24 @@ ] }, "limit": { - "context": 40000, - "output": 40000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "mistralai/ministral-3b", - "name": "Mistral: Ministral 3B", - "display_name": "Mistral: Ministral 3B", + "id": "mistralai/ministral-3b-2512", + "name": "Mistral: Ministral 3 3B 2512", + "display_name": "Mistral: Ministral 3 3B 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -65117,7 +73713,7 @@ "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { "id": "mistralai/ministral-8b", @@ -65142,6 +73738,30 @@ }, "type": "chat" }, + { + "id": "mistralai/ministral-8b-2512", + "name": "Mistral: Ministral 3 8B 2512", + "display_name": "Mistral: Ministral 3 8B 2512", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "imageGeneration" + }, { "id": "mistralai/mistral-7b-instruct", "name": "Mistral: Mistral 7B Instruct", @@ -65327,9 +73947,9 @@ "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral: Mistral Medium 3", - "display_name": "Mistral: Mistral Medium 3", + "id": "mistralai/mistral-large-2512", + "name": "Mistral: Mistral Large 3 2512", + "display_name": "Mistral: Mistral Large 3 2512", "modalities": { "input": [ "text", @@ -65340,8 +73960,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -65351,9 +73971,9 @@ "type": "imageGeneration" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral: Mistral Medium 3.1", - "display_name": "Mistral: Mistral Medium 3.1", + "id": "mistralai/mistral-medium-3", + "name": "Mistral: Mistral Medium 3", + "display_name": "Mistral: Mistral Medium 3", "modalities": { "input": [ "text", @@ -65375,12 +73995,13 @@ "type": "imageGeneration" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral: Mistral Nemo", - "display_name": "Mistral: Mistral Nemo", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral: Mistral Medium 3.1", + "display_name": "Mistral: Mistral Medium 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -65388,19 +74009,19 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral: Saba", - "display_name": "Mistral: Saba", + "id": "mistralai/mistral-nemo", + "name": "Mistral: Mistral Nemo", + "display_name": "Mistral: Mistral Nemo", "modalities": { "input": [ "text" @@ -65410,8 +74031,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -65421,9 +74042,9 @@ "type": "chat" }, { - "id": "mistralai/mistral-small", - "name": "Mistral Small", - "display_name": "Mistral Small", + "id": "mistralai/mistral-saba", + "name": "Mistral: Saba", + "display_name": "Mistral: Saba", "modalities": { "input": [ "text" @@ -65457,7 +74078,7 @@ }, "limit": { "context": 32768, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -65813,28 +74434,6 @@ }, "type": "chat" }, - { - "id": "moonshotai/kimi-linear-48b-a3b-instruct", - "name": "MoonshotAI: Kimi Linear 48B A3B Instruct", - "display_name": "MoonshotAI: Kimi Linear 48B A3B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1048576, - "output": 1048576 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "morph/morph-v3-fast", "name": "Morph: Morph V3 Fast", @@ -65923,6 +74522,28 @@ }, "type": "chat" }, + { + "id": "nex-agi/deepseek-v3.1-nex-n1:free", + "name": "Nex AGI: DeepSeek V3.1 Nex N1 (free)", + "display_name": "Nex AGI: DeepSeek V3.1 Nex N1 (free)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 163840 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "nousresearch/deephermes-3-mistral-24b-preview", "name": "Nous: DeepHermes 3 Mistral 24B Preview", @@ -67079,6 +75700,30 @@ }, "type": "imageGeneration" }, + { + "id": "openai/gpt-5.1-codex-max", + "name": "OpenAI: GPT-5.1-Codex-Max", + "display_name": "OpenAI: GPT-5.1-Codex-Max", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "imageGeneration" + }, { "id": "openai/gpt-5.1-codex-mini", "name": "OpenAI: GPT-5.1-Codex-Mini", @@ -67103,6 +75748,80 @@ }, "type": "imageGeneration" }, + { + "id": "openai/gpt-5.2", + "name": "OpenAI: GPT-5.2", + "display_name": "OpenAI: GPT-5.2", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "openai/gpt-5.2-chat", + "name": "OpenAI: GPT-5.2 Chat", + "display_name": "OpenAI: GPT-5.2 Chat", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "openai/gpt-5.2-pro", + "name": "OpenAI: GPT-5.2 Pro", + "display_name": "OpenAI: GPT-5.2 Pro", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, { "id": "openai/gpt-oss-120b", "name": "OpenAI: gpt-oss-120b", @@ -67117,7 +75836,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "tool_call": true, "reasoning": { @@ -67140,7 +75859,30 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "openai/gpt-oss-120b:free", + "name": "OpenAI: gpt-oss-120b (free)", + "display_name": "OpenAI: gpt-oss-120b (free)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -67186,7 +75928,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 128000 }, "tool_call": true, "reasoning": { @@ -67513,28 +76255,26 @@ "type": "chat" }, { - "id": "openrouter/bert-nebulon-alpha", - "name": "Bert-Nebulon Alpha", - "display_name": "Bert-Nebulon Alpha", + "id": "openrouter/bodybuilder", + "name": "Body Builder", + "display_name": "Body Builder", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { "id": "perplexity/sonar", @@ -68073,13 +76813,12 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, @@ -68369,7 +77108,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "tool_call": true, "reasoning": { @@ -68482,8 +77221,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -68682,6 +77421,28 @@ }, "type": "chat" }, + { + "id": "relace/relace-search", + "name": "Relace: Relace Search", + "display_name": "Relace: Relace Search", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "sao10k/l3-euryale-70b", "name": "Sao10k: Llama 3 Euryale 70B v2.1", @@ -68862,28 +77623,6 @@ }, "type": "chat" }, - { - "id": "thedrummer/anubis-70b-v1.1", - "name": "TheDrummer: Anubis 70B V1.1", - "display_name": "TheDrummer: Anubis 70B V1.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "thedrummer/cydonia-24b-v4.1", "name": "TheDrummer: Cydonia 24B V4.1", @@ -69295,9 +78034,9 @@ "type": "imageGeneration" }, { - "id": "x-ai/grok-4.1-fast:free", - "name": "xAI: Grok 4.1 Fast (free)", - "display_name": "xAI: Grok 4.1 Fast (free)", + "id": "x-ai/grok-4.1-fast", + "name": "xAI: Grok 4.1 Fast", + "display_name": "xAI: Grok 4.1 Fast", "modalities": { "input": [ "text", @@ -69509,6 +78248,32 @@ "default": true }, "type": "chat" + }, + { + "id": "z-ai/glm-4.6v", + "name": "Z.AI: GLM 4.6V", + "display_name": "Z.AI: GLM 4.6V", + "modalities": { + "input": [ + "image", + "text", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 24000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "imageGeneration" } ] }, @@ -69546,7 +78311,8 @@ "display_name": "claude-3-5-haiku-20241022", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69568,7 +78334,8 @@ "display_name": "claude-3-5-sonnet-20241022", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69590,7 +78357,8 @@ "display_name": "claude-3-7-sonnet-20250219", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69612,7 +78380,8 @@ "display_name": "claude-3-haiku-20240307", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69657,7 +78426,8 @@ "display_name": "claude-opus-4-1-20250805", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69679,7 +78449,8 @@ "display_name": "claude-opus-4-20250514", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69724,7 +78495,8 @@ "display_name": "claude-sonnet-4-20250514", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69837,7 +78609,8 @@ "display_name": "doubao-1-5-pro-32k-250115", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69859,7 +78632,8 @@ "display_name": "doubao-1.5-pro-32k-character-250715", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69903,7 +78677,8 @@ "display_name": "ERNIE 4.5 VL 424B A47B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69926,7 +78701,10 @@ "display_name": "gemini-2.0-flash-20250609", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -69948,7 +78726,10 @@ "display_name": "gemini-2.0-flash-lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -69970,7 +78751,10 @@ "display_name": "gemini-2.5-flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -69992,7 +78776,10 @@ "display_name": "gemini-2.5-flash-lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -70014,7 +78801,10 @@ "display_name": "gemini-2.5-flash-lite-preview-06-17", "modalities": { "input": [ - "text" + "text", + "video", + "image", + "audio" ], "output": [ "text" @@ -70037,7 +78827,9 @@ "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" @@ -70060,7 +78852,10 @@ "display_name": "gemini-2.5-flash-preview-05-20", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -70082,7 +78877,10 @@ "display_name": "gemini-2.5-pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -70104,7 +78902,10 @@ "display_name": "gemini-2.5-pro-preview-06-05", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -70127,7 +78928,9 @@ "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" @@ -70149,7 +78952,8 @@ "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70171,7 +78975,8 @@ "display_name": "Gemma3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70193,7 +78998,8 @@ "display_name": "GLM 4.1V 9B Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70216,7 +79022,9 @@ "display_name": "GLM 4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -70262,7 +79070,8 @@ "display_name": "gpt-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70284,7 +79093,8 @@ "display_name": "gpt-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70306,7 +79116,8 @@ "display_name": "gpt-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70328,7 +79139,8 @@ "display_name": "gpt-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70350,7 +79162,8 @@ "display_name": "gpt-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70372,7 +79185,8 @@ "display_name": "gpt-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70395,7 +79209,8 @@ "display_name": "gpt-5-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70440,7 +79255,8 @@ "display_name": "gpt-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70463,7 +79279,8 @@ "display_name": "gpt-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70509,7 +79326,8 @@ "display_name": "gpt-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70532,7 +79350,8 @@ "display_name": "gpt-5.1-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70555,7 +79374,78 @@ "display_name": "gpt-5.1-codex", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gpt-5.2-pro", + "name": "gpt-5.2-pro", + "display_name": "gpt-5.2-pro", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" @@ -70578,7 +79468,8 @@ "display_name": "grok-3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70600,7 +79491,8 @@ "display_name": "grok-3-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70622,7 +79514,8 @@ "display_name": "grok-4-0709", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70736,7 +79629,8 @@ "display_name": "grok-code-fast-1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70912,7 +79806,8 @@ "display_name": "Llama 4 Maverick Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -70934,7 +79829,8 @@ "display_name": "Llama 4 Scout Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71045,7 +79941,8 @@ "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71067,7 +79964,8 @@ "display_name": "o1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71089,7 +79987,8 @@ "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71111,7 +80010,8 @@ "display_name": "o3-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71133,7 +80033,8 @@ "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71156,7 +80057,8 @@ "display_name": "OpenAI: GPT OSS 20B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71245,7 +80147,9 @@ "display_name": "Qwen2.5 VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" diff --git a/src/renderer/shell/App.vue b/src/renderer/shell/App.vue index bc1b113d8..a9dbd2ae1 100644 --- a/src/renderer/shell/App.vue +++ b/src/renderer/shell/App.vue @@ -13,11 +13,14 @@ import { useRouter } from 'vue-router' import AppBar from './components/AppBar.vue' import { useDeviceVersion } from '@/composables/useDeviceVersion' import { useMcpStore } from '@/stores/mcp' +import { useFontManager } from '@/composables/useFontManager' // Detect platform to apply proper styling const { isWinMacOS } = useDeviceVersion() const router = useRouter() const mcpStore = useMcpStore() +const { setupFontListener } = useFontManager() +setupFontListener() onMounted(async () => { // Check for pending MCP install from localStorage (cold start scenario) diff --git a/src/renderer/shell/tooltip-overlay/main.ts b/src/renderer/shell/tooltip-overlay/main.ts index 3d943b823..1d13a32e6 100644 --- a/src/renderer/shell/tooltip-overlay/main.ts +++ b/src/renderer/shell/tooltip-overlay/main.ts @@ -1,4 +1,7 @@ import '@/assets/main.css' +import { CONFIG_EVENTS } from '@/events' +import { usePresenter } from '@/composables/usePresenter' +import { buildFontStack, DEFAULT_CODE_FONT_STACK, DEFAULT_TEXT_FONT_STACK } from '@/lib/fontStack' type TooltipOverlayShowPayload = { x: number @@ -6,6 +9,18 @@ type TooltipOverlayShowPayload = { text: string } +const configPresenter = usePresenter('configPresenter') + +const applyFontVariables = (textFont: string, codeFont: string) => { + document.documentElement.style.setProperty('--dc-font-family', textFont) + document.documentElement.style.setProperty('--dc-code-font-family', codeFont) +} + +const toTextFontStack = (font: unknown) => + buildFontStack(typeof font === 'string' ? font : '', DEFAULT_TEXT_FONT_STACK) +const toCodeFontStack = (font: unknown) => + buildFontStack(typeof font === 'string' ? font : '', DEFAULT_CODE_FONT_STACK) + const root = document.getElementById('app') if (!root) { throw new Error('Tooltip overlay: missing #app') @@ -29,6 +44,26 @@ root.appendChild(tooltip) const { ipcRenderer } = window.electron +const initFonts = async () => { + const [fontFamily, codeFontFamily] = await Promise.all([ + configPresenter.getFontFamily(), + configPresenter.getCodeFontFamily() + ]) + applyFontVariables(toTextFontStack(fontFamily), toCodeFontStack(codeFontFamily)) +} + +initFonts().catch((error) => { + console.warn('Tooltip overlay: failed to initialize fonts', error) +}) + +ipcRenderer.on(CONFIG_EVENTS.FONT_FAMILY_CHANGED, (_event, value) => { + document.documentElement.style.setProperty('--dc-font-family', toTextFontStack(value)) +}) + +ipcRenderer.on(CONFIG_EVENTS.CODE_FONT_FAMILY_CHANGED, (_event, value) => { + document.documentElement.style.setProperty('--dc-code-font-family', toCodeFontStack(value)) +}) + const hide = () => { tooltip.classList.add('hidden') } diff --git a/src/renderer/src/lib/fontStack.ts b/src/renderer/src/lib/fontStack.ts new file mode 100644 index 000000000..291e6b9e9 --- /dev/null +++ b/src/renderer/src/lib/fontStack.ts @@ -0,0 +1,13 @@ +export const DEFAULT_TEXT_FONT_STACK = + "'Geist', Noto Sans, ui-sans-serif, system-ui, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol', 'Noto Color Emoji'" + +export const DEFAULT_CODE_FONT_STACK = + "'JetBrains Mono', 'Fira Code', 'Menlo', 'Monaco', 'Consolas', 'Courier New', monospace" + +export const buildFontStack = (custom: string, fallback: string) => { + const normalized = (custom || '').trim() + if (!normalized) return fallback + const wrapped = + /\s/.test(normalized) && !normalized.includes(',') ? `"${normalized}"` : normalized + return `${wrapped}, ${fallback}` +} diff --git a/src/renderer/src/stores/uiSettingsStore.ts b/src/renderer/src/stores/uiSettingsStore.ts index 5bca34005..ec54c5228 100644 --- a/src/renderer/src/stores/uiSettingsStore.ts +++ b/src/renderer/src/stores/uiSettingsStore.ts @@ -2,21 +2,10 @@ import { ref, computed, onMounted, onBeforeUnmount } from 'vue' import { defineStore } from 'pinia' import { usePresenter } from '@/composables/usePresenter' import { CONFIG_EVENTS } from '@/events' +import { buildFontStack, DEFAULT_CODE_FONT_STACK, DEFAULT_TEXT_FONT_STACK } from '@/lib/fontStack' const FONT_SIZE_CLASSES = ['text-sm', 'text-base', 'text-lg', 'text-xl', 'text-2xl'] const DEFAULT_FONT_SIZE_LEVEL = 1 -const DEFAULT_FONT_STACK = - "'Geist', Noto Sans, ui-sans-serif, system-ui, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol', 'Noto Color Emoji'" -const DEFAULT_CODE_FONT_STACK = - "'JetBrains Mono', 'Fira Code', 'Menlo', 'Monaco', 'Consolas', 'Courier New', monospace" - -const buildFontStack = (custom: string, fallback: string) => { - const normalized = (custom || '').trim() - if (!normalized) return fallback - const wrapped = - /\s/.test(normalized) && !normalized.includes(',') ? `"${normalized}"` : normalized - return `${wrapped}, ${fallback}` -} export const useUiSettingsStore = defineStore('uiSettings', () => { const configP = usePresenter('configPresenter') @@ -38,7 +27,9 @@ export const useUiSettingsStore = defineStore('uiSettings', () => { () => FONT_SIZE_CLASSES[fontSizeLevel.value] || FONT_SIZE_CLASSES[DEFAULT_FONT_SIZE_LEVEL] ) - const formattedFontFamily = computed(() => buildFontStack(fontFamily.value, DEFAULT_FONT_STACK)) + const formattedFontFamily = computed(() => + buildFontStack(fontFamily.value, DEFAULT_TEXT_FONT_STACK) + ) const formattedCodeFontFamily = computed(() => buildFontStack(codeFontFamily.value, DEFAULT_CODE_FONT_STACK) )