diff --git a/packages/ai-openrouter/src/model-meta.ts b/packages/ai-openrouter/src/model-meta.ts index cec4ced80..fb3c1cbf2 100644 --- a/packages/ai-openrouter/src/model-meta.ts +++ b/packages/ai-openrouter/src/model-meta.ts @@ -410,41 +410,6 @@ const ALFREDPROS_CODELLAMA_7B_INSTRUCT_SOLIDITY = { image: 0, }, } as const -const ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B = { - id: 'alibaba/tongyi-deepresearch-30b-a3b', - name: 'Tongyi DeepResearch 30B A3B', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'frequencyPenalty', - 'logitBias', - 'maxCompletionTokens', - 'presencePenalty', - 'reasoning', - 'responseFormat', - 'seed', - 'stop', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 131072, - max_output_tokens: 131072, - pricing: { - text: { - input: { - normal: 0.09, - cached: 0.09, - }, - output: { - normal: 0.45, - }, - }, - image: 0, - }, -} as const const ALLENAI_OLMO_3_32B_THINK = { id: 'allenai/olmo-3-32b-think', name: 'AllenAI: Olmo 3 32B Think', @@ -1157,35 +1122,6 @@ const ARCEE_AI_TRINITY_LARGE_THINKING = { image: 0, }, } as const -const ARCEE_AI_TRINITY_LARGE_THINKING_FREE = { - id: 'arcee-ai/trinity-large-thinking:free', - name: 'Arcee AI: Trinity Large Thinking (free)', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'maxCompletionTokens', - 'reasoning', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 262144, - max_output_tokens: 80000, - pricing: { - text: { - input: { - normal: 0, - cached: 0, - }, - output: { - normal: 0, - }, - }, - image: 0, - }, -} as const const ARCEE_AI_TRINITY_MINI = { id: 'arcee-ai/trinity-mini', name: 'Arcee AI: Trinity Mini', @@ -1837,16 +1773,16 @@ const DEEPSEEK_DEEPSEEK_CHAT = { 'topP', ], }, - context_window: 163840, - max_output_tokens: 16384, + context_window: 131072, + max_output_tokens: 16000, pricing: { text: { input: { - normal: 0.32, + normal: 0.2288, cached: 0, }, output: { - normal: 0.89, + normal: 0.9144, }, }, image: 0, @@ -2222,14 +2158,15 @@ const DEEPSEEK_DEEPSEEK_V4_FLASH = { ], }, context_window: 1048576, + max_output_tokens: 16384, pricing: { text: { input: { - normal: 0.112, - cached: 0.022, + normal: 0.1, + cached: 0.02, }, output: { - normal: 0.224, + normal: 0.2, }, }, image: 0, @@ -8263,8 +8200,8 @@ const POOLSIDE_LAGUNA_M_1_FREE = { output: ['text'], supports: ['maxCompletionTokens', 'reasoning', 'temperature', 'toolChoice'], }, - context_window: 131072, - max_output_tokens: 8192, + context_window: 262144, + max_output_tokens: 32768, pricing: { text: { input: { @@ -8286,8 +8223,8 @@ const POOLSIDE_LAGUNA_XS_2_FREE = { output: ['text'], supports: ['maxCompletionTokens', 'reasoning', 'temperature', 'toolChoice'], }, - context_window: 131072, - max_output_tokens: 8192, + context_window: 262144, + max_output_tokens: 32768, pricing: { text: { input: { @@ -8486,7 +8423,7 @@ const QWEN_QWEN_PLUS_2025_07_28 = { text: { input: { normal: 0.26, - cached: 0.325, + cached: 0, }, output: { normal: 0.78, @@ -9671,7 +9608,7 @@ const QWEN_QWEN3_5_FLASH_02_23 = { text: { input: { normal: 0.065, - cached: 0.08125, + cached: 0, }, output: { normal: 0.26, @@ -9703,7 +9640,7 @@ const QWEN_QWEN3_5_PLUS_02_15 = { text: { input: { normal: 0.26, - cached: 0.325, + cached: 0, }, output: { normal: 1.56, @@ -9735,7 +9672,7 @@ const QWEN_QWEN3_5_PLUS_20260420 = { text: { input: { normal: 0.3, - cached: 0, + cached: 0.375, }, output: { normal: 1.8, @@ -9767,11 +9704,11 @@ const QWEN_QWEN3_6_27B = { ], }, context_window: 262144, - max_output_tokens: 262144, + max_output_tokens: 262140, pricing: { text: { input: { - normal: 0.3, + normal: 0.29, cached: 0, }, output: { @@ -9804,12 +9741,12 @@ const QWEN_QWEN3_6_35B_A3B = { ], }, context_window: 262144, - max_output_tokens: 262144, + max_output_tokens: 262140, pricing: { text: { input: { - normal: 0.15, - cached: 0.05, + normal: 0.14, + cached: 0, }, output: { normal: 1, @@ -9840,11 +9777,11 @@ const QWEN_QWEN3_6_FLASH = { pricing: { text: { input: { - normal: 0.12375, - cached: 0.1545, + normal: 0.1875, + cached: 0.234375, }, output: { - normal: 0.7425, + normal: 1.125, }, }, image: 0, @@ -9906,11 +9843,11 @@ const QWEN_QWEN3_6_PLUS = { pricing: { text: { input: { - normal: 0.1794, - cached: 0.2236, + normal: 0.325, + cached: 0.40625, }, output: { - normal: 1.07315, + normal: 1.95, }, }, image: 0, @@ -9940,11 +9877,11 @@ const QWEN_QWEN3_7_MAX = { pricing: { text: { input: { - normal: 2.5, - cached: 3.125, + normal: 1.25, + cached: 1.8125, }, output: { - normal: 7.5, + normal: 3.75, }, }, image: 0, @@ -10834,11 +10771,11 @@ const XIAOMI_MIMO_V2_5 = { pricing: { text: { input: { - normal: 0.4, - cached: 0.08, + normal: 0.14, + cached: 0.0028, }, output: { - normal: 2, + normal: 0.28, }, }, image: 0, @@ -10865,15 +10802,15 @@ const XIAOMI_MIMO_V2_5_PRO = { ], }, context_window: 1048576, - max_output_tokens: 16384, + max_output_tokens: 131072, pricing: { text: { input: { - normal: 1, - cached: 0.2, + normal: 0.435, + cached: 0.0036, }, output: { - normal: 3, + normal: 0.87, }, }, image: 0, @@ -10946,6 +10883,7 @@ const Z_AI_GLM_4_5_AIR = { 'maxCompletionTokens', 'presencePenalty', 'reasoning', + 'responseFormat', 'seed', 'stop', 'temperature', @@ -10954,15 +10892,15 @@ const Z_AI_GLM_4_5_AIR = { ], }, context_window: 131072, - max_output_tokens: 98304, + max_output_tokens: 131070, pricing: { text: { input: { - normal: 0.13, - cached: 0.025, + normal: 0.125, + cached: 0, }, output: { - normal: 0.85, + normal: 0.84, }, }, image: 0, @@ -11442,21 +11380,6 @@ export type OpenRouterModelOptionsByName = { | 'temperature' | 'topP' > - [ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'logitBias' - | 'maxCompletionTokens' - | 'presencePenalty' - | 'reasoning' - | 'responseFormat' - | 'seed' - | 'stop' - | 'temperature' - | 'toolChoice' - | 'topP' - > [ALLENAI_OLMO_3_32B_THINK.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -11690,15 +11613,6 @@ export type OpenRouterModelOptionsByName = { | 'toolChoice' | 'topP' > - [ARCEE_AI_TRINITY_LARGE_THINKING_FREE.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'maxCompletionTokens' - | 'reasoning' - | 'temperature' - | 'toolChoice' - | 'topP' - > [ARCEE_AI_TRINITY_MINI.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -15449,6 +15363,7 @@ export type OpenRouterModelOptionsByName = { | 'maxCompletionTokens' | 'presencePenalty' | 'reasoning' + | 'responseFormat' | 'seed' | 'stop' | 'temperature' @@ -15625,7 +15540,6 @@ export type OpenRouterModelInputModalitiesByName = { [AION_LABS_AION_2_0.id]: ReadonlyArray<'text'> [AION_LABS_AION_RP_LLAMA_3_1_8B.id]: ReadonlyArray<'text'> [ALFREDPROS_CODELLAMA_7B_INSTRUCT_SOLIDITY.id]: ReadonlyArray<'text'> - [ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B.id]: ReadonlyArray<'text'> [ALLENAI_OLMO_3_32B_THINK.id]: ReadonlyArray<'text'> [AMAZON_NOVA_2_LITE_V1.id]: ReadonlyArray< 'text' | 'image' | 'video' | 'document' @@ -15656,7 +15570,6 @@ export type OpenRouterModelInputModalitiesByName = { [ARCEE_AI_MAESTRO_REASONING.id]: ReadonlyArray<'text'> [ARCEE_AI_SPOTLIGHT.id]: ReadonlyArray<'image' | 'text'> [ARCEE_AI_TRINITY_LARGE_THINKING.id]: ReadonlyArray<'text'> - [ARCEE_AI_TRINITY_LARGE_THINKING_FREE.id]: ReadonlyArray<'text'> [ARCEE_AI_TRINITY_MINI.id]: ReadonlyArray<'text'> [ARCEE_AI_VIRTUOSO_LARGE.id]: ReadonlyArray<'text'> [BAIDU_COBUDDY_FREE.id]: ReadonlyArray<'text'> @@ -16037,7 +15950,6 @@ export const OPENROUTER_CHAT_MODELS = [ AION_LABS_AION_2_0.id, AION_LABS_AION_RP_LLAMA_3_1_8B.id, ALFREDPROS_CODELLAMA_7B_INSTRUCT_SOLIDITY.id, - ALIBABA_TONGYI_DEEPRESEARCH_30B_A3B.id, ALLENAI_OLMO_3_32B_THINK.id, AMAZON_NOVA_2_LITE_V1.id, AMAZON_NOVA_LITE_V1.id, @@ -16062,7 +15974,6 @@ export const OPENROUTER_CHAT_MODELS = [ ARCEE_AI_MAESTRO_REASONING.id, ARCEE_AI_SPOTLIGHT.id, ARCEE_AI_TRINITY_LARGE_THINKING.id, - ARCEE_AI_TRINITY_LARGE_THINKING_FREE.id, ARCEE_AI_TRINITY_MINI.id, ARCEE_AI_VIRTUOSO_LARGE.id, BAIDU_COBUDDY_FREE.id, @@ -16379,10 +16290,7 @@ export const OPENROUTER_CHAT_MODELS = [ ] as const export type OpenRouterChatModelToolCapabilitiesByName = { - [K in (typeof OPENROUTER_CHAT_MODELS)[number]]: readonly [ - 'web_search', - 'web_fetch', - ] + [K in (typeof OPENROUTER_CHAT_MODELS)[number]]: readonly ['web_search'] } export const OPENROUTER_IMAGE_MODELS = [ diff --git a/scripts/.sync-models-last-run b/scripts/.sync-models-last-run index 1f83e39bc..1daf3ace8 100644 --- a/scripts/.sync-models-last-run +++ b/scripts/.sync-models-last-run @@ -1 +1 @@ -1779439521 +1779872161 diff --git a/scripts/openrouter.models.json b/scripts/openrouter.models.json index 9cd7a646e..4cc0d0edd 100644 --- a/scripts/openrouter.models.json +++ b/scripts/openrouter.models.json @@ -701,63 +701,6 @@ "details": "/api/v1/models/alfredpros/codellama-7b-instruct-solidity/endpoints" } }, - { - "id": "alibaba/tongyi-deepresearch-30b-a3b", - "canonical_slug": "alibaba/tongyi-deepresearch-30b-a3b", - "hugging_face_id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", - "name": "Tongyi DeepResearch 30B A3B", - "created": 1758210804, - "description": "Tongyi DeepResearch is an agentic large language model developed by Tongyi Lab, with 30 billion total parameters activating only 3 billion per token. It's optimized for long-horizon, deep information-seeking tasks...", - "context_length": 131072, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0.00000009", - "completion": "0.00000045", - "input_cache_read": "0.00000009" - }, - "top_provider": { - "context_length": 131072, - "max_completion_tokens": 131072, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "include_reasoning", - "logit_bias", - "max_tokens", - "min_p", - "presence_penalty", - "reasoning", - "repetition_penalty", - "response_format", - "seed", - "stop", - "structured_outputs", - "temperature", - "tool_choice", - "tools", - "top_k", - "top_p" - ], - "default_parameters": { - "temperature": null, - "top_p": null, - "frequency_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": "2025-03-31", - "expiration_date": null, - "links": { - "details": "/api/v1/models/alibaba/tongyi-deepresearch-30b-a3b/endpoints" - } - }, { "id": "allenai/olmo-3-32b-think", "canonical_slug": "allenai/olmo-3-32b-think-20251121", @@ -1977,56 +1920,6 @@ "details": "/api/v1/models/arcee-ai/trinity-large-thinking/endpoints" } }, - { - "id": "arcee-ai/trinity-large-thinking:free", - "canonical_slug": "arcee-ai/trinity-large-thinking", - "hugging_face_id": "arcee-ai/Trinity-Large-Thinking", - "name": "Arcee AI: Trinity Large Thinking (free)", - "created": 1775058318, - "description": "Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI. It shows strong performance in PinchBench, agentic workloads, and reasoning tasks. Launch video: https://youtu.be/Gc82AXLa0Rg?si=4RLn6WBz33qT--B7...", - "context_length": 262144, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0", - "completion": "0" - }, - "top_provider": { - "context_length": 262144, - "max_completion_tokens": 80000, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "include_reasoning", - "max_tokens", - "reasoning", - "temperature", - "tool_choice", - "tools", - "top_k", - "top_p" - ], - "default_parameters": { - "temperature": 0.3, - "top_p": 0.8, - "top_k": null, - "frequency_penalty": null, - "presence_penalty": null, - "repetition_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": null, - "expiration_date": null, - "links": { - "details": "/api/v1/models/arcee-ai/trinity-large-thinking/endpoints" - } - }, { "id": "arcee-ai/trinity-mini", "canonical_slug": "arcee-ai/trinity-mini-20251201", @@ -2159,7 +2052,7 @@ "default_parameters": {}, "supported_voices": null, "knowledge_cutoff": null, - "expiration_date": null, + "expiration_date": "2026-05-27", "links": { "details": "/api/v1/models/baidu/cobuddy-20260430/endpoints" } @@ -2992,7 +2885,7 @@ "name": "DeepSeek: DeepSeek V3", "created": 1735241320, "description": "DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions. Pre-trained on nearly 15 trillion tokens, the reported evaluations...", - "context_length": 163840, + "context_length": 131072, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -3001,12 +2894,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000032", - "completion": "0.00000089" + "prompt": "0.0000002288", + "completion": "0.0000009144" }, "top_provider": { - "context_length": 163840, - "max_completion_tokens": 16384, + "context_length": 128000, + "max_completion_tokens": 16000, "is_moderated": false }, "per_request_limits": null, @@ -3596,13 +3489,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000000112", - "completion": "0.000000224", - "input_cache_read": "0.000000022" + "prompt": "0.0000001", + "completion": "0.0000002", + "input_cache_read": "0.00000002" }, "top_provider": { - "context_length": 1048575, - "max_completion_tokens": null, + "context_length": 1048576, + "max_completion_tokens": 16384, "is_moderated": false }, "per_request_limits": null, @@ -3956,7 +3849,10 @@ "default_parameters": { "temperature": null, "top_p": null, - "frequency_penalty": null + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null }, "supported_voices": null, "knowledge_cutoff": "2025-01-31", @@ -8891,7 +8787,7 @@ "default_parameters": {}, "supported_voices": null, "knowledge_cutoff": "2023-12-31", - "expiration_date": null, + "expiration_date": "2026-06-05", "links": { "details": "/api/v1/models/nousresearch/hermes-2-pro-llama-3-8b/endpoints" } @@ -13213,7 +13109,7 @@ "name": "Poolside: Laguna M.1 (free)", "created": 1777388504, "description": "Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai), optimized for complex software engineering tasks. Designed for agentic coding workflows, it supports tool calling and reasoning, with a 128K...", - "context_length": 131072, + "context_length": 262144, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -13226,8 +13122,8 @@ "completion": "0" }, "top_provider": { - "context_length": 131072, - "max_completion_tokens": 8192, + "context_length": 262144, + "max_completion_tokens": 32768, "is_moderated": false }, "per_request_limits": null, @@ -13261,7 +13157,7 @@ "name": "Poolside: Laguna XS.2 (free)", "created": 1777389604, "description": "Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai), their efficient coding agent series. It combines tool calling and reasoning capabilities with a compact footprint, offering...", - "context_length": 131072, + "context_length": 262144, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -13274,8 +13170,8 @@ "completion": "0" }, "top_provider": { - "context_length": 131072, - "max_completion_tokens": 8192, + "context_length": 262144, + "max_completion_tokens": 32768, "is_moderated": false }, "per_request_limits": null, @@ -13565,8 +13461,7 @@ }, "pricing": { "prompt": "0.00000026", - "completion": "0.00000078", - "input_cache_write": "0.000000325" + "completion": "0.00000078" }, "top_provider": { "context_length": 1000000, @@ -13955,7 +13850,7 @@ }, "supported_voices": null, "knowledge_cutoff": "2025-03-31", - "expiration_date": null, + "expiration_date": "2026-06-05", "links": { "details": "/api/v1/models/qwen/qwen3-30b-a3b-04-28/endpoints" } @@ -15422,8 +15317,7 @@ }, "pricing": { "prompt": "0.000000065", - "completion": "0.00000026", - "input_cache_write": "0.00000008125" + "completion": "0.00000026" }, "top_provider": { "context_length": 1000000, @@ -15473,8 +15367,7 @@ }, "pricing": { "prompt": "0.00000026", - "completion": "0.00000156", - "input_cache_write": "0.000000325" + "completion": "0.00000156" }, "top_provider": { "context_length": 1000000, @@ -15524,7 +15417,8 @@ }, "pricing": { "prompt": "0.0000003", - "completion": "0.0000018" + "completion": "0.0000018", + "input_cache_write": "0.000000375" }, "top_provider": { "context_length": 1000000, @@ -15569,12 +15463,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000003", + "prompt": "0.00000029", "completion": "0.0000032" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 262144, + "context_length": 262140, + "max_completion_tokens": 262140, "is_moderated": false }, "per_request_limits": null, @@ -15630,13 +15524,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000015", - "completion": "0.000001", - "input_cache_read": "0.00000005" + "prompt": "0.00000014", + "completion": "0.000001" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 262144, + "context_length": 262140, + "max_completion_tokens": 262140, "is_moderated": false }, "per_request_limits": null, @@ -15689,9 +15582,9 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000012375", - "completion": "0.0000007425", - "input_cache_write": "0.0000001545" + "prompt": "0.0000001875", + "completion": "0.000001125", + "input_cache_write": "0.000000234375" }, "top_provider": { "context_length": 1000000, @@ -15785,9 +15678,9 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000001794", - "completion": "0.00000107315", - "input_cache_write": "0.0000002236" + "prompt": "0.000000325", + "completion": "0.00000195", + "input_cache_write": "0.00000040625" }, "top_provider": { "context_length": 1000000, @@ -15839,9 +15732,10 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000025", - "completion": "0.0000075", - "input_cache_write": "0.000003125" + "prompt": "0.00000125", + "completion": "0.00000375", + "input_cache_read": "0.00000025", + "input_cache_write": "0.0000015625" }, "top_provider": { "context_length": 1000000, @@ -16109,7 +16003,7 @@ "default_parameters": {}, "supported_voices": null, "knowledge_cutoff": "2023-12-31", - "expiration_date": null, + "expiration_date": "2026-06-05", "links": { "details": "/api/v1/models/sao10k/l3-euryale-70b/endpoints" } @@ -17251,9 +17145,9 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000004", - "completion": "0.000002", - "input_cache_read": "0.00000008" + "prompt": "0.00000014", + "completion": "0.00000028", + "input_cache_read": "0.0000000028" }, "top_provider": { "context_length": 1048576, @@ -17305,13 +17199,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000001", - "completion": "0.000003", - "input_cache_read": "0.0000002" + "prompt": "0.000000435", + "completion": "0.00000087", + "input_cache_read": "0.0000000036" }, "top_provider": { "context_length": 1048576, - "max_completion_tokens": 16384, + "max_completion_tokens": 131072, "is_moderated": false }, "per_request_limits": null, @@ -17463,13 +17357,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000013", - "completion": "0.00000085", - "input_cache_read": "0.000000025" + "prompt": "0.000000125", + "completion": "0.00000084" }, "top_provider": { - "context_length": 131072, - "max_completion_tokens": 98304, + "context_length": 131070, + "max_completion_tokens": 131070, "is_moderated": false }, "per_request_limits": null, @@ -17480,6 +17373,7 @@ "presence_penalty", "reasoning", "repetition_penalty", + "response_format", "seed", "stop", "temperature",