diff --git a/packages/ai-openrouter/src/model-meta.ts b/packages/ai-openrouter/src/model-meta.ts index cec4ced80..c93ff4103 100644 --- a/packages/ai-openrouter/src/model-meta.ts +++ b/packages/ai-openrouter/src/model-meta.ts @@ -410,41 +410,6 @@ const ALFREDPROS_CODELLAMA_7B_INSTRUCT_SOLIDITY = { image: 0, }, } as const -const ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B = { - id: 'alibaba/tongyi-deepresearch-30b-a3b', - name: 'Tongyi DeepResearch 30B A3B', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'frequencyPenalty', - 'logitBias', - 'maxCompletionTokens', - 'presencePenalty', - 'reasoning', - 'responseFormat', - 'seed', - 'stop', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 131072, - max_output_tokens: 131072, - pricing: { - text: { - input: { - normal: 0.09, - cached: 0.09, - }, - output: { - normal: 0.45, - }, - }, - image: 0, - }, -} as const const ALLENAI_OLMO_3_32B_THINK = { id: 'allenai/olmo-3-32b-think', name: 'AllenAI: Olmo 3 32B Think', @@ -1157,35 +1122,6 @@ const ARCEE_AI_TRINITY_LARGE_THINKING = { image: 0, }, } as const -const ARCEE_AI_TRINITY_LARGE_THINKING_FREE = { - id: 'arcee-ai/trinity-large-thinking:free', - name: 'Arcee AI: Trinity Large Thinking (free)', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'maxCompletionTokens', - 'reasoning', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 262144, - max_output_tokens: 80000, - pricing: { - text: { - input: { - normal: 0, - cached: 0, - }, - output: { - normal: 0, - }, - }, - image: 0, - }, -} as const const ARCEE_AI_TRINITY_MINI = { id: 'arcee-ai/trinity-mini', name: 'Arcee AI: Trinity Mini', @@ -1250,29 +1186,6 @@ const ARCEE_AI_VIRTUOSO_LARGE = { image: 0, }, } as const -const BAIDU_COBUDDY_FREE = { - id: 'baidu/cobuddy:free', - name: 'Baidu Qianfan: CoBuddy (free)', - supports: { - input: ['text'], - output: ['text'], - supports: ['maxCompletionTokens', 'reasoning', 'stop'], - }, - context_window: 131072, - max_output_tokens: 65536, - pricing: { - text: { - input: { - normal: 0, - cached: 0, - }, - output: { - normal: 0, - }, - }, - image: 0, - }, -} as const const BAIDU_ERNIE_4_5_21B_A3B = { id: 'baidu/ernie-4.5-21b-a3b', name: 'Baidu: ERNIE 4.5 21B A3B', @@ -1837,16 +1750,16 @@ const DEEPSEEK_DEEPSEEK_CHAT = { 'topP', ], }, - context_window: 163840, - max_output_tokens: 16384, + context_window: 131072, + max_output_tokens: 16000, pricing: { text: { input: { - normal: 0.32, + normal: 0.2288, cached: 0, }, output: { - normal: 0.89, + normal: 0.9144, }, }, image: 0, @@ -2222,14 +2135,15 @@ const DEEPSEEK_DEEPSEEK_V4_FLASH = { ], }, context_window: 1048576, + max_output_tokens: 16384, pricing: { text: { input: { - normal: 0.112, - cached: 0.022, + normal: 0.1, + cached: 0.02, }, output: { - normal: 0.224, + normal: 0.2, }, }, image: 0, @@ -3764,7 +3678,6 @@ const META_LLAMA_LLAMA_3_1_8B_INSTRUCT = { supports: [ 'frequencyPenalty', 'logitBias', - 'logprobs', 'maxCompletionTokens', 'presencePenalty', 'responseFormat', @@ -3772,7 +3685,6 @@ const META_LLAMA_LLAMA_3_1_8B_INSTRUCT = { 'stop', 'temperature', 'toolChoice', - 'topLogprobs', 'topP', ], }, @@ -4414,7 +4326,7 @@ const MINIMAX_MINIMAX_M2_5_FREE = { 'temperature', ], }, - context_window: 204800, + context_window: 262144, max_output_tokens: 8192, pricing: { text: { @@ -5422,6 +5334,28 @@ const MOONSHOTAI_KIMI_K2_6 = { image: 0, }, } as const +const MOONSHOTAI_KIMI_K2_6_FREE = { + id: 'moonshotai/kimi-k2.6:free', + name: 'MoonshotAI: Kimi K2.6 (free)', + supports: { + input: ['text', 'image'], + output: ['text'], + supports: ['reasoning', 'toolChoice'], + }, + context_window: 262144, + pricing: { + text: { + input: { + normal: 0, + cached: 0, + }, + output: { + normal: 0, + }, + }, + image: 0, + }, +} as const const MORPH_MORPH_V3_FAST = { id: 'morph/morph-v3-fast', name: 'Morph: Morph V3 Fast', @@ -6982,12 +6916,12 @@ const OPENAI_GPT_5_1_CHAT = { ], }, context_window: 128000, - max_output_tokens: 16384, + max_output_tokens: 32000, pricing: { text: { input: { normal: 1.25, - cached: 0.125, + cached: 0.13, }, output: { normal: 10, @@ -7017,7 +6951,7 @@ const OPENAI_GPT_5_1_CODEX = { text: { input: { normal: 1.25, - cached: 0.125, + cached: 0.13, }, output: { normal: 10, @@ -7072,12 +7006,12 @@ const OPENAI_GPT_5_1_CODEX_MINI = { ], }, context_window: 400000, - max_output_tokens: 128000, + max_output_tokens: 100000, pricing: { text: { input: { normal: 0.25, - cached: 0.03, + cached: 0.025, }, output: { normal: 2, @@ -7131,7 +7065,7 @@ const OPENAI_GPT_5_2_CHAT = { ], }, context_window: 128000, - max_output_tokens: 32000, + max_output_tokens: 16384, pricing: { text: { input: { @@ -8263,8 +8197,8 @@ const POOLSIDE_LAGUNA_M_1_FREE = { output: ['text'], supports: ['maxCompletionTokens', 'reasoning', 'temperature', 'toolChoice'], }, - context_window: 131072, - max_output_tokens: 8192, + context_window: 262144, + max_output_tokens: 32768, pricing: { text: { input: { @@ -8286,8 +8220,8 @@ const POOLSIDE_LAGUNA_XS_2_FREE = { output: ['text'], supports: ['maxCompletionTokens', 'reasoning', 'temperature', 'toolChoice'], }, - context_window: 131072, - max_output_tokens: 8192, + context_window: 262144, + max_output_tokens: 32768, pricing: { text: { input: { @@ -8486,7 +8420,7 @@ const QWEN_QWEN_PLUS_2025_07_28 = { text: { input: { normal: 0.26, - cached: 0.325, + cached: 0, }, output: { normal: 0.78, @@ -8637,7 +8571,6 @@ const QWEN_QWEN3_235B_A22B_2507 = { supports: [ 'frequencyPenalty', 'logitBias', - 'logprobs', 'maxCompletionTokens', 'presencePenalty', 'responseFormat', @@ -8645,7 +8578,6 @@ const QWEN_QWEN3_235B_A22B_2507 = { 'stop', 'temperature', 'toolChoice', - 'topLogprobs', 'topP', ], }, @@ -9671,7 +9603,7 @@ const QWEN_QWEN3_5_FLASH_02_23 = { text: { input: { normal: 0.065, - cached: 0.08125, + cached: 0, }, output: { normal: 0.26, @@ -9703,7 +9635,7 @@ const QWEN_QWEN3_5_PLUS_02_15 = { text: { input: { normal: 0.26, - cached: 0.325, + cached: 0, }, output: { normal: 1.56, @@ -9735,7 +9667,7 @@ const QWEN_QWEN3_5_PLUS_20260420 = { text: { input: { normal: 0.3, - cached: 0, + cached: 0.375, }, output: { normal: 1.8, @@ -9767,11 +9699,11 @@ const QWEN_QWEN3_6_27B = { ], }, context_window: 262144, - max_output_tokens: 262144, + max_output_tokens: 262140, pricing: { text: { input: { - normal: 0.3, + normal: 0.29, cached: 0, }, output: { @@ -9804,12 +9736,12 @@ const QWEN_QWEN3_6_35B_A3B = { ], }, context_window: 262144, - max_output_tokens: 262144, + max_output_tokens: 262140, pricing: { text: { input: { - normal: 0.15, - cached: 0.05, + normal: 0.14, + cached: 0, }, output: { normal: 1, @@ -9840,11 +9772,11 @@ const QWEN_QWEN3_6_FLASH = { pricing: { text: { input: { - normal: 0.12375, - cached: 0.1545, + normal: 0.1875, + cached: 0.234375, }, output: { - normal: 0.7425, + normal: 1.125, }, }, image: 0, @@ -9906,11 +9838,11 @@ const QWEN_QWEN3_6_PLUS = { pricing: { text: { input: { - normal: 0.1794, - cached: 0.2236, + normal: 0.325, + cached: 0.40625, }, output: { - normal: 1.07315, + normal: 1.95, }, }, image: 0, @@ -9940,11 +9872,11 @@ const QWEN_QWEN3_7_MAX = { pricing: { text: { input: { - normal: 2.5, - cached: 3.125, + normal: 1.25, + cached: 1.8125, }, output: { - normal: 7.5, + normal: 3.75, }, }, image: 0, @@ -10336,6 +10268,7 @@ const TENCENT_HY3_PREVIEW = { 'maxCompletionTokens', 'presencePenalty', 'reasoning', + 'seed', 'stop', 'temperature', 'toolChoice', @@ -10343,15 +10276,14 @@ const TENCENT_HY3_PREVIEW = { ], }, context_window: 262144, - max_output_tokens: 262144, pricing: { text: { input: { - normal: 0.066, - cached: 0.029, + normal: 0.063, + cached: 0.021, }, output: { - normal: 0.26, + normal: 0.21, }, }, image: 0, @@ -10834,11 +10766,11 @@ const XIAOMI_MIMO_V2_5 = { pricing: { text: { input: { - normal: 0.4, - cached: 0.08, + normal: 0.14, + cached: 0.0028, }, output: { - normal: 2, + normal: 0.28, }, }, image: 0, @@ -10865,15 +10797,15 @@ const XIAOMI_MIMO_V2_5_PRO = { ], }, context_window: 1048576, - max_output_tokens: 16384, + max_output_tokens: 131072, pricing: { text: { input: { - normal: 1, - cached: 0.2, + normal: 0.435, + cached: 0.0036, }, output: { - normal: 3, + normal: 0.87, }, }, image: 0, @@ -10946,6 +10878,7 @@ const Z_AI_GLM_4_5_AIR = { 'maxCompletionTokens', 'presencePenalty', 'reasoning', + 'responseFormat', 'seed', 'stop', 'temperature', @@ -10954,15 +10887,15 @@ const Z_AI_GLM_4_5_AIR = { ], }, context_window: 131072, - max_output_tokens: 98304, + max_output_tokens: 131070, pricing: { text: { input: { - normal: 0.13, - cached: 0.025, + normal: 0.125, + cached: 0, }, output: { - normal: 0.85, + normal: 0.84, }, }, image: 0, @@ -11442,21 +11375,6 @@ export type OpenRouterModelOptionsByName = { | 'temperature' | 'topP' > - [ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'logitBias' - | 'maxCompletionTokens' - | 'presencePenalty' - | 'reasoning' - | 'responseFormat' - | 'seed' - | 'stop' - | 'temperature' - | 'toolChoice' - | 'topP' - > [ALLENAI_OLMO_3_32B_THINK.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -11690,15 +11608,6 @@ export type OpenRouterModelOptionsByName = { | 'toolChoice' | 'topP' > - [ARCEE_AI_TRINITY_LARGE_THINKING_FREE.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'maxCompletionTokens' - | 'reasoning' - | 'temperature' - | 'toolChoice' - | 'topP' - > [ARCEE_AI_TRINITY_MINI.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -11723,8 +11632,6 @@ export type OpenRouterModelOptionsByName = { | 'toolChoice' | 'topP' > - [BAIDU_COBUDDY_FREE.id]: OpenRouterCommonOptions & - Pick [BAIDU_ERNIE_4_5_21B_A3B.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -12676,7 +12583,6 @@ export type OpenRouterModelOptionsByName = { OpenRouterBaseOptions, | 'frequencyPenalty' | 'logitBias' - | 'logprobs' | 'maxCompletionTokens' | 'presencePenalty' | 'responseFormat' @@ -12684,7 +12590,6 @@ export type OpenRouterModelOptionsByName = { | 'stop' | 'temperature' | 'toolChoice' - | 'topLogprobs' | 'topP' > [META_LLAMA_LLAMA_3_2_11B_VISION_INSTRUCT.id]: OpenRouterCommonOptions & @@ -13338,6 +13243,8 @@ export type OpenRouterModelOptionsByName = { | 'topLogprobs' | 'topP' > + [MOONSHOTAI_KIMI_K2_6_FREE.id]: OpenRouterCommonOptions & + Pick [MORPH_MORPH_V3_FAST.id]: OpenRouterCommonOptions & Pick [MORPH_MORPH_V3_LARGE.id]: OpenRouterCommonOptions & @@ -14526,7 +14433,6 @@ export type OpenRouterModelOptionsByName = { OpenRouterBaseOptions, | 'frequencyPenalty' | 'logitBias' - | 'logprobs' | 'maxCompletionTokens' | 'presencePenalty' | 'responseFormat' @@ -14534,7 +14440,6 @@ export type OpenRouterModelOptionsByName = { | 'stop' | 'temperature' | 'toolChoice' - | 'topLogprobs' | 'topP' > [QWEN_QWEN3_235B_A22B_THINKING_2507.id]: OpenRouterCommonOptions & @@ -15209,6 +15114,7 @@ export type OpenRouterModelOptionsByName = { | 'maxCompletionTokens' | 'presencePenalty' | 'reasoning' + | 'seed' | 'stop' | 'temperature' | 'toolChoice' @@ -15449,6 +15355,7 @@ export type OpenRouterModelOptionsByName = { | 'maxCompletionTokens' | 'presencePenalty' | 'reasoning' + | 'responseFormat' | 'seed' | 'stop' | 'temperature' @@ -15625,7 +15532,6 @@ export type OpenRouterModelInputModalitiesByName = { [AION_LABS_AION_2_0.id]: ReadonlyArray<'text'> [AION_LABS_AION_RP_LLAMA_3_1_8B.id]: ReadonlyArray<'text'> [ALFREDPROS_CODELLAMA_7B_INSTRUCT_SOLIDITY.id]: ReadonlyArray<'text'> - [ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B.id]: ReadonlyArray<'text'> [ALLENAI_OLMO_3_32B_THINK.id]: ReadonlyArray<'text'> [AMAZON_NOVA_2_LITE_V1.id]: ReadonlyArray< 'text' | 'image' | 'video' | 'document' @@ -15656,10 +15562,8 @@ export type OpenRouterModelInputModalitiesByName = { [ARCEE_AI_MAESTRO_REASONING.id]: ReadonlyArray<'text'> [ARCEE_AI_SPOTLIGHT.id]: ReadonlyArray<'image' | 'text'> [ARCEE_AI_TRINITY_LARGE_THINKING.id]: ReadonlyArray<'text'> - [ARCEE_AI_TRINITY_LARGE_THINKING_FREE.id]: ReadonlyArray<'text'> [ARCEE_AI_TRINITY_MINI.id]: ReadonlyArray<'text'> [ARCEE_AI_VIRTUOSO_LARGE.id]: ReadonlyArray<'text'> - [BAIDU_COBUDDY_FREE.id]: ReadonlyArray<'text'> [BAIDU_ERNIE_4_5_21B_A3B.id]: ReadonlyArray<'text'> [BAIDU_ERNIE_4_5_21B_A3B_THINKING.id]: ReadonlyArray<'text'> [BAIDU_ERNIE_4_5_300B_A47B.id]: ReadonlyArray<'text'> @@ -15826,6 +15730,7 @@ export type OpenRouterModelInputModalitiesByName = { [MOONSHOTAI_KIMI_K2_THINKING.id]: ReadonlyArray<'text'> [MOONSHOTAI_KIMI_K2_5.id]: ReadonlyArray<'text' | 'image'> [MOONSHOTAI_KIMI_K2_6.id]: ReadonlyArray<'text' | 'image'> + [MOONSHOTAI_KIMI_K2_6_FREE.id]: ReadonlyArray<'text' | 'image'> [MORPH_MORPH_V3_FAST.id]: ReadonlyArray<'text'> [MORPH_MORPH_V3_LARGE.id]: ReadonlyArray<'text'> [NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id]: ReadonlyArray<'text'> @@ -16037,7 +15942,6 @@ export const OPENROUTER_CHAT_MODELS = [ AION_LABS_AION_2_0.id, AION_LABS_AION_RP_LLAMA_3_1_8B.id, ALFREDPROS_CODELLAMA_7B_INSTRUCT_SOLIDITY.id, - ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B.id, ALLENAI_OLMO_3_32B_THINK.id, AMAZON_NOVA_2_LITE_V1.id, AMAZON_NOVA_LITE_V1.id, @@ -16062,10 +15966,8 @@ export const OPENROUTER_CHAT_MODELS = [ ARCEE_AI_MAESTRO_REASONING.id, ARCEE_AI_SPOTLIGHT.id, ARCEE_AI_TRINITY_LARGE_THINKING.id, - ARCEE_AI_TRINITY_LARGE_THINKING_FREE.id, ARCEE_AI_TRINITY_MINI.id, ARCEE_AI_VIRTUOSO_LARGE.id, - BAIDU_COBUDDY_FREE.id, BAIDU_ERNIE_4_5_21B_A3B.id, BAIDU_ERNIE_4_5_21B_A3B_THINKING.id, BAIDU_ERNIE_4_5_300B_A47B.id, @@ -16192,6 +16094,7 @@ export const OPENROUTER_CHAT_MODELS = [ MOONSHOTAI_KIMI_K2_THINKING.id, MOONSHOTAI_KIMI_K2_5.id, MOONSHOTAI_KIMI_K2_6.id, + MOONSHOTAI_KIMI_K2_6_FREE.id, MORPH_MORPH_V3_FAST.id, MORPH_MORPH_V3_LARGE.id, NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id, @@ -16379,10 +16282,7 @@ export const OPENROUTER_CHAT_MODELS = [ ] as const export type OpenRouterChatModelToolCapabilitiesByName = { - [K in (typeof OPENROUTER_CHAT_MODELS)[number]]: readonly [ - 'web_search', - 'web_fetch', - ] + [K in (typeof OPENROUTER_CHAT_MODELS)[number]]: readonly ['web_search'] } export const OPENROUTER_IMAGE_MODELS = [ diff --git a/scripts/.sync-models-last-run b/scripts/.sync-models-last-run index 1f83e39bc..3e47207be 100644 --- a/scripts/.sync-models-last-run +++ b/scripts/.sync-models-last-run @@ -1 +1 @@ -1779439521 +1779961160 diff --git a/scripts/openrouter.models.json b/scripts/openrouter.models.json index 9cd7a646e..8d470e937 100644 --- a/scripts/openrouter.models.json +++ b/scripts/openrouter.models.json @@ -426,7 +426,7 @@ "top_provider": { "context_length": 400000, "max_completion_tokens": 128000, - "is_moderated": false + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -701,63 +701,6 @@ "details": "/api/v1/models/alfredpros/codellama-7b-instruct-solidity/endpoints" } }, - { - "id": "alibaba/tongyi-deepresearch-30b-a3b", - "canonical_slug": "alibaba/tongyi-deepresearch-30b-a3b", - "hugging_face_id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", - "name": "Tongyi DeepResearch 30B A3B", - "created": 1758210804, - "description": "Tongyi DeepResearch is an agentic large language model developed by Tongyi Lab, with 30 billion total parameters activating only 3 billion per token. It's optimized for long-horizon, deep information-seeking tasks...", - "context_length": 131072, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0.00000009", - "completion": "0.00000045", - "input_cache_read": "0.00000009" - }, - "top_provider": { - "context_length": 131072, - "max_completion_tokens": 131072, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "include_reasoning", - "logit_bias", - "max_tokens", - "min_p", - "presence_penalty", - "reasoning", - "repetition_penalty", - "response_format", - "seed", - "stop", - "structured_outputs", - "temperature", - "tool_choice", - "tools", - "top_k", - "top_p" - ], - "default_parameters": { - "temperature": null, - "top_p": null, - "frequency_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": "2025-03-31", - "expiration_date": null, - "links": { - "details": "/api/v1/models/alibaba/tongyi-deepresearch-30b-a3b/endpoints" - } - }, { "id": "allenai/olmo-3-32b-think", "canonical_slug": "allenai/olmo-3-32b-think-20251121", @@ -1977,56 +1920,6 @@ "details": "/api/v1/models/arcee-ai/trinity-large-thinking/endpoints" } }, - { - "id": "arcee-ai/trinity-large-thinking:free", - "canonical_slug": "arcee-ai/trinity-large-thinking", - "hugging_face_id": "arcee-ai/Trinity-Large-Thinking", - "name": "Arcee AI: Trinity Large Thinking (free)", - "created": 1775058318, - "description": "Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI. It shows strong performance in PinchBench, agentic workloads, and reasoning tasks. Launch video: https://youtu.be/Gc82AXLa0Rg?si=4RLn6WBz33qT--B7...", - "context_length": 262144, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0", - "completion": "0" - }, - "top_provider": { - "context_length": 262144, - "max_completion_tokens": 80000, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "include_reasoning", - "max_tokens", - "reasoning", - "temperature", - "tool_choice", - "tools", - "top_k", - "top_p" - ], - "default_parameters": { - "temperature": 0.3, - "top_p": 0.8, - "top_k": null, - "frequency_penalty": null, - "presence_penalty": null, - "repetition_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": null, - "expiration_date": null, - "links": { - "details": "/api/v1/models/arcee-ai/trinity-large-thinking/endpoints" - } - }, { "id": "arcee-ai/trinity-mini", "canonical_slug": "arcee-ai/trinity-mini-20251201", @@ -2124,46 +2017,6 @@ "details": "/api/v1/models/arcee-ai/virtuoso-large/endpoints" } }, - { - "id": "baidu/cobuddy:free", - "canonical_slug": "baidu/cobuddy-20260430", - "hugging_face_id": null, - "name": "Baidu Qianfan: CoBuddy (free)", - "created": 1778035480, - "description": "CoBuddy is a code generation model from Baidu, optimized for coding tasks and AI Agent workflows. It features high inference throughput and low end-to-end latency, with native support for tool...", - "context_length": 131072, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0", - "completion": "0" - }, - "top_provider": { - "context_length": 131072, - "max_completion_tokens": 65536, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "include_reasoning", - "max_tokens", - "reasoning", - "stop", - "tools" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": null, - "expiration_date": null, - "links": { - "details": "/api/v1/models/baidu/cobuddy-20260430/endpoints" - } - }, { "id": "baidu/ernie-4.5-21b-a3b", "canonical_slug": "baidu/ernie-4.5-21b-a3b", @@ -2992,7 +2845,7 @@ "name": "DeepSeek: DeepSeek V3", "created": 1735241320, "description": "DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions. Pre-trained on nearly 15 trillion tokens, the reported evaluations...", - "context_length": 163840, + "context_length": 131072, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -3001,12 +2854,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000032", - "completion": "0.00000089" + "prompt": "0.0000002288", + "completion": "0.0000009144" }, "top_provider": { - "context_length": 163840, - "max_completion_tokens": 16384, + "context_length": 128000, + "max_completion_tokens": 16000, "is_moderated": false }, "per_request_limits": null, @@ -3596,13 +3449,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000000112", - "completion": "0.000000224", - "input_cache_read": "0.000000022" + "prompt": "0.0000001", + "completion": "0.0000002", + "input_cache_read": "0.00000002" }, "top_provider": { - "context_length": 1048575, - "max_completion_tokens": null, + "context_length": 1048576, + "max_completion_tokens": 16384, "is_moderated": false }, "per_request_limits": null, @@ -3956,7 +3809,10 @@ "default_parameters": { "temperature": null, "top_p": null, - "frequency_penalty": null + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null }, "supported_voices": null, "knowledge_cutoff": "2025-01-31", @@ -6180,7 +6036,6 @@ "supported_parameters": [ "frequency_penalty", "logit_bias", - "logprobs", "max_tokens", "min_p", "presence_penalty", @@ -6193,7 +6048,6 @@ "tool_choice", "tools", "top_k", - "top_logprobs", "top_p" ], "default_parameters": {}, @@ -7125,7 +6979,7 @@ "name": "MiniMax: MiniMax M2.5 (free)", "created": 1770908502, "description": "MiniMax-M2.5 is a SOTA large language model designed for real-world productivity. Trained in a diverse range of complex real-world digital working environments, M2.5 builds upon the coding expertise of M2.1...", - "context_length": 204800, + "context_length": 262144, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -7138,7 +6992,7 @@ "completion": "0" }, "top_provider": { - "context_length": 196608, + "context_length": 262144, "max_completion_tokens": 8192, "is_moderated": true }, @@ -8726,6 +8580,52 @@ "details": "/api/v1/models/moonshotai/kimi-k2.6-20260420/endpoints" } }, + { + "id": "moonshotai/kimi-k2.6:free", + "canonical_slug": "moonshotai/kimi-k2.6-20260420", + "hugging_face_id": "moonshotai/Kimi-K2.6", + "name": "MoonshotAI: Kimi K2.6 (free)", + "created": 1776699402, + "description": "Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration. It handles complex end-to-end coding tasks across Python, Rust, and Go, and...", + "context_length": 262144, + "architecture": { + "modality": "text+image->text", + "input_modalities": ["text", "image"], + "output_modalities": ["text"], + "tokenizer": "Other", + "instruct_type": null + }, + "pricing": { + "prompt": "0", + "completion": "0" + }, + "top_provider": { + "context_length": 262144, + "max_completion_tokens": null, + "is_moderated": false + }, + "per_request_limits": null, + "supported_parameters": [ + "include_reasoning", + "reasoning", + "tool_choice", + "tools" + ], + "default_parameters": { + "temperature": null, + "top_p": null, + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null + }, + "supported_voices": null, + "knowledge_cutoff": null, + "expiration_date": null, + "links": { + "details": "/api/v1/models/moonshotai/kimi-k2.6-20260420/endpoints" + } + }, { "id": "morph/morph-v3-fast", "canonical_slug": "morph/morph-v3-fast", @@ -8891,7 +8791,7 @@ "default_parameters": {}, "supported_voices": null, "knowledge_cutoff": "2023-12-31", - "expiration_date": null, + "expiration_date": "2026-06-05", "links": { "details": "/api/v1/models/nousresearch/hermes-2-pro-llama-3-8b/endpoints" } @@ -11098,12 +10998,12 @@ "prompt": "0.00000125", "completion": "0.00001", "web_search": "0.01", - "input_cache_read": "0.000000125" + "input_cache_read": "0.00000013" }, "top_provider": { "context_length": 128000, - "max_completion_tokens": 16384, - "is_moderated": true + "max_completion_tokens": 32000, + "is_moderated": false }, "per_request_limits": null, "supported_parameters": [ @@ -11146,12 +11046,12 @@ "prompt": "0.00000125", "completion": "0.00001", "web_search": "0.01", - "input_cache_read": "0.000000125" + "input_cache_read": "0.00000013" }, "top_provider": { "context_length": 400000, "max_completion_tokens": 128000, - "is_moderated": true + "is_moderated": false }, "per_request_limits": null, "supported_parameters": [ @@ -11252,12 +11152,12 @@ "prompt": "0.00000025", "completion": "0.000002", "web_search": "0.01", - "input_cache_read": "0.00000003" + "input_cache_read": "0.000000025" }, "top_provider": { "context_length": 400000, - "max_completion_tokens": 128000, - "is_moderated": false + "max_completion_tokens": 100000, + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -11310,7 +11210,7 @@ "top_provider": { "context_length": 400000, "max_completion_tokens": 128000, - "is_moderated": false + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -11362,8 +11262,8 @@ }, "top_provider": { "context_length": 128000, - "max_completion_tokens": 32000, - "is_moderated": false + "max_completion_tokens": 16384, + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -11382,7 +11282,7 @@ }, "supported_voices": null, "knowledge_cutoff": null, - "expiration_date": null, + "expiration_date": "2026-08-10", "links": { "details": "/api/v1/models/openai/gpt-5.2-chat-20251211/endpoints" } @@ -11411,7 +11311,7 @@ "top_provider": { "context_length": 400000, "max_completion_tokens": 128000, - "is_moderated": false + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -11613,7 +11513,7 @@ "top_provider": { "context_length": 1050000, "max_completion_tokens": 128000, - "is_moderated": false + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -11722,7 +11622,7 @@ "top_provider": { "context_length": 400000, "max_completion_tokens": 128000, - "is_moderated": false + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -11827,7 +11727,7 @@ "top_provider": { "context_length": 1050000, "max_completion_tokens": 128000, - "is_moderated": false + "is_moderated": true }, "per_request_limits": null, "supported_parameters": [ @@ -13213,7 +13113,7 @@ "name": "Poolside: Laguna M.1 (free)", "created": 1777388504, "description": "Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai), optimized for complex software engineering tasks. Designed for agentic coding workflows, it supports tool calling and reasoning, with a 128K...", - "context_length": 131072, + "context_length": 262144, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -13226,8 +13126,8 @@ "completion": "0" }, "top_provider": { - "context_length": 131072, - "max_completion_tokens": 8192, + "context_length": 262144, + "max_completion_tokens": 32768, "is_moderated": false }, "per_request_limits": null, @@ -13261,7 +13161,7 @@ "name": "Poolside: Laguna XS.2 (free)", "created": 1777389604, "description": "Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai), their efficient coding agent series. It combines tool calling and reasoning capabilities with a compact footprint, offering...", - "context_length": 131072, + "context_length": 262144, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -13274,8 +13174,8 @@ "completion": "0" }, "top_provider": { - "context_length": 131072, - "max_completion_tokens": 8192, + "context_length": 262144, + "max_completion_tokens": 32768, "is_moderated": false }, "per_request_limits": null, @@ -13565,8 +13465,7 @@ }, "pricing": { "prompt": "0.00000026", - "completion": "0.00000078", - "input_cache_write": "0.000000325" + "completion": "0.00000078" }, "top_provider": { "context_length": 1000000, @@ -13822,7 +13721,6 @@ "supported_parameters": [ "frequency_penalty", "logit_bias", - "logprobs", "max_tokens", "min_p", "presence_penalty", @@ -13835,7 +13733,6 @@ "tool_choice", "tools", "top_k", - "top_logprobs", "top_p" ], "default_parameters": {}, @@ -13955,7 +13852,7 @@ }, "supported_voices": null, "knowledge_cutoff": "2025-03-31", - "expiration_date": null, + "expiration_date": "2026-06-05", "links": { "details": "/api/v1/models/qwen/qwen3-30b-a3b-04-28/endpoints" } @@ -15422,8 +15319,7 @@ }, "pricing": { "prompt": "0.000000065", - "completion": "0.00000026", - "input_cache_write": "0.00000008125" + "completion": "0.00000026" }, "top_provider": { "context_length": 1000000, @@ -15473,8 +15369,7 @@ }, "pricing": { "prompt": "0.00000026", - "completion": "0.00000156", - "input_cache_write": "0.000000325" + "completion": "0.00000156" }, "top_provider": { "context_length": 1000000, @@ -15524,7 +15419,8 @@ }, "pricing": { "prompt": "0.0000003", - "completion": "0.0000018" + "completion": "0.0000018", + "input_cache_write": "0.000000375" }, "top_provider": { "context_length": 1000000, @@ -15569,12 +15465,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000003", + "prompt": "0.00000029", "completion": "0.0000032" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 262144, + "context_length": 262140, + "max_completion_tokens": 262140, "is_moderated": false }, "per_request_limits": null, @@ -15630,13 +15526,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000015", - "completion": "0.000001", - "input_cache_read": "0.00000005" + "prompt": "0.00000014", + "completion": "0.000001" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 262144, + "context_length": 262140, + "max_completion_tokens": 262140, "is_moderated": false }, "per_request_limits": null, @@ -15689,9 +15584,9 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000012375", - "completion": "0.0000007425", - "input_cache_write": "0.0000001545" + "prompt": "0.0000001875", + "completion": "0.000001125", + "input_cache_write": "0.000000234375" }, "top_provider": { "context_length": 1000000, @@ -15785,9 +15680,9 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000001794", - "completion": "0.00000107315", - "input_cache_write": "0.0000002236" + "prompt": "0.000000325", + "completion": "0.00000195", + "input_cache_write": "0.00000040625" }, "top_provider": { "context_length": 1000000, @@ -15839,9 +15734,10 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000025", - "completion": "0.0000075", - "input_cache_write": "0.000003125" + "prompt": "0.00000125", + "completion": "0.00000375", + "input_cache_read": "0.00000025", + "input_cache_write": "0.0000015625" }, "top_provider": { "context_length": 1000000, @@ -16109,7 +16005,7 @@ "default_parameters": {}, "supported_voices": null, "knowledge_cutoff": "2023-12-31", - "expiration_date": null, + "expiration_date": "2026-06-05", "links": { "details": "/api/v1/models/sao10k/l3-euryale-70b/endpoints" } @@ -16464,13 +16360,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000000066", - "completion": "0.00000026", - "input_cache_read": "0.000000029" + "prompt": "0.000000063", + "completion": "0.00000021", + "input_cache_read": "0.000000021" }, "top_provider": { "context_length": 262144, - "max_completion_tokens": 262144, + "max_completion_tokens": null, "is_moderated": false }, "per_request_limits": null, @@ -16480,6 +16376,7 @@ "max_tokens", "presence_penalty", "reasoning", + "seed", "stop", "temperature", "tool_choice", @@ -17251,9 +17148,9 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000004", - "completion": "0.000002", - "input_cache_read": "0.00000008" + "prompt": "0.00000014", + "completion": "0.00000028", + "input_cache_read": "0.0000000028" }, "top_provider": { "context_length": 1048576, @@ -17305,13 +17202,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000001", - "completion": "0.000003", - "input_cache_read": "0.0000002" + "prompt": "0.000000435", + "completion": "0.00000087", + "input_cache_read": "0.0000000036" }, "top_provider": { "context_length": 1048576, - "max_completion_tokens": 16384, + "max_completion_tokens": 131072, "is_moderated": false }, "per_request_limits": null, @@ -17463,13 +17360,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000013", - "completion": "0.00000085", - "input_cache_read": "0.000000025" + "prompt": "0.000000125", + "completion": "0.00000084" }, "top_provider": { - "context_length": 131072, - "max_completion_tokens": 98304, + "context_length": 131070, + "max_completion_tokens": 131070, "is_moderated": false }, "per_request_limits": null, @@ -17480,6 +17376,7 @@ "presence_penalty", "reasoning", "repetition_penalty", + "response_format", "seed", "stop", "temperature",