diff --git a/.changeset/sync-models.md b/.changeset/sync-models.md new file mode 100644 index 000000000..3949386d6 --- /dev/null +++ b/.changeset/sync-models.md @@ -0,0 +1,5 @@ +--- +'@tanstack/ai-anthropic': patch +--- + +Update model metadata from OpenRouter API diff --git a/packages/ai-anthropic/src/model-meta.ts b/packages/ai-anthropic/src/model-meta.ts index 86301ed7d..94df2ba39 100644 --- a/packages/ai-anthropic/src/model-meta.ts +++ b/packages/ai-anthropic/src/model-meta.ts @@ -710,6 +710,45 @@ const CLAUDE_OPUS_4_8_FAST = { AnthropicSamplingOptions > +const CLAUDE_FABLE_5 = { + name: 'claude-fable-5', + id: 'claude-fable-5', + context_window: 1_000_000, + max_output_tokens: 128_000, + supports: { + input: ['text', 'image', 'document'], + extended_thinking: true, + priority_tier: true, + tools: [ + 'web_search', + 'web_fetch', + 'code_execution', + 'computer_use', + 'bash', + 'text_editor', + 'memory', + ], + }, + pricing: { + input: { + normal: 10, + cached: 1, + }, + output: { + normal: 50, + }, + }, +} as const satisfies ModelMeta< + AnthropicContainerOptions & + AnthropicContextManagementOptions & + AnthropicMCPOptions & + AnthropicServiceTierOptions & + AnthropicStopSequencesOptions & + AnthropicThinkingOptions & + AnthropicToolChoiceOptions & + AnthropicSamplingOptions +> + export const ANTHROPIC_MODELS = [ CLAUDE_OPUS_4_6.id, CLAUDE_OPUS_4_5.id, @@ -731,6 +770,8 @@ export const ANTHROPIC_MODELS = [ CLAUDE_OPUS_4_8.id, CLAUDE_OPUS_4_8_FAST.id, + + CLAUDE_FABLE_5.id, ] as const /** @@ -891,6 +932,14 @@ export type AnthropicChatModelProviderOptionsByName = { AnthropicThinkingOptions & AnthropicToolChoiceOptions & AnthropicSamplingOptions + [CLAUDE_FABLE_5.id]: AnthropicContainerOptions & + AnthropicContextManagementOptions & + AnthropicMCPOptions & + AnthropicServiceTierOptions & + AnthropicStopSequencesOptions & + AnthropicThinkingOptions & + AnthropicToolChoiceOptions & + AnthropicSamplingOptions } export type AnthropicChatModelToolCapabilitiesByName = { @@ -937,4 +986,5 @@ export type AnthropicModelInputModalitiesByName = { [CLAUDE_OPUS_4_7_FAST.id]: typeof CLAUDE_OPUS_4_7_FAST.supports.input [CLAUDE_OPUS_4_8.id]: typeof CLAUDE_OPUS_4_8.supports.input [CLAUDE_OPUS_4_8_FAST.id]: typeof CLAUDE_OPUS_4_8_FAST.supports.input + [CLAUDE_FABLE_5.id]: typeof CLAUDE_FABLE_5.supports.input } diff --git a/packages/ai-openrouter/src/model-meta.ts b/packages/ai-openrouter/src/model-meta.ts index 42122cd2c..d7b08cc41 100644 --- a/packages/ai-openrouter/src/model-meta.ts +++ b/packages/ai-openrouter/src/model-meta.ts @@ -3,6 +3,36 @@ import type { OpenRouterCommonOptions, } from './text/text-provider-options' +const _ANTHROPIC_CLAUDE_FABLE_LATEST = { + id: '~anthropic/claude-fable-latest', + name: 'Anthropic: Claude Fable Latest', + supports: { + input: ['text', 'image', 'document'], + output: ['text'], + supports: [ + 'maxCompletionTokens', + 'maxCompletionTokens', + 'reasoning', + 'responseFormat', + 'stop', + 'toolChoice', + ], + }, + context_window: 1000000, + max_output_tokens: 128000, + pricing: { + text: { + input: { + normal: 10, + cached: 13.5, + }, + output: { + normal: 50, + }, + }, + image: 0, + }, +} as const const _ANTHROPIC_CLAUDE_HAIKU_LATEST = { id: '~anthropic/claude-haiku-latest', name: 'Anthropic Claude Haiku Latest', @@ -183,15 +213,15 @@ const _MOONSHOTAI_KIMI_LATEST = { ], }, context_window: 262144, - max_output_tokens: 262144, + max_output_tokens: 262142, pricing: { text: { input: { - normal: 0.684, - cached: 0.144, + normal: 0.68, + cached: 0.34, }, output: { - normal: 3.42, + normal: 3.41, }, }, image: 0, @@ -628,6 +658,36 @@ const ANTHROPIC_CLAUDE_3_5_HAIKU = { image: 0, }, } as const +const ANTHROPIC_CLAUDE_FABLE_5 = { + id: 'anthropic/claude-fable-5', + name: 'Anthropic: Claude Fable 5', + supports: { + input: ['text', 'image', 'document'], + output: ['text'], + supports: [ + 'maxCompletionTokens', + 'maxCompletionTokens', + 'reasoning', + 'responseFormat', + 'stop', + 'toolChoice', + ], + }, + context_window: 1000000, + max_output_tokens: 128000, + pricing: { + text: { + input: { + normal: 10, + cached: 13.5, + }, + output: { + normal: 50, + }, + }, + image: 0, + }, +} as const const ANTHROPIC_CLAUDE_HAIKU_4_5 = { id: 'anthropic/claude-haiku-4.5', name: 'Anthropic: Claude Haiku 4.5', @@ -1052,68 +1112,6 @@ const ARCEE_AI_CODER_LARGE = { image: 0, }, } as const -const ARCEE_AI_MAESTRO_REASONING = { - id: 'arcee-ai/maestro-reasoning', - name: 'Arcee AI: Maestro Reasoning', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'frequencyPenalty', - 'logitBias', - 'maxCompletionTokens', - 'presencePenalty', - 'stop', - 'temperature', - 'topP', - ], - }, - context_window: 131072, - max_output_tokens: 32000, - pricing: { - text: { - input: { - normal: 0.9, - cached: 0, - }, - output: { - normal: 3.3, - }, - }, - image: 0, - }, -} as const -const ARCEE_AI_SPOTLIGHT = { - id: 'arcee-ai/spotlight', - name: 'Arcee AI: Spotlight', - supports: { - input: ['image', 'text'], - output: ['text'], - supports: [ - 'frequencyPenalty', - 'logitBias', - 'maxCompletionTokens', - 'presencePenalty', - 'stop', - 'temperature', - 'topP', - ], - }, - context_window: 131072, - max_output_tokens: 65537, - pricing: { - text: { - input: { - normal: 0.18, - cached: 0, - }, - output: { - normal: 0.18, - }, - }, - image: 0, - }, -} as const const ARCEE_AI_TRINITY_LARGE_THINKING = { id: 'arcee-ai/trinity-large-thinking', name: 'Arcee AI: Trinity Large Thinking', @@ -1213,39 +1211,6 @@ const ARCEE_AI_VIRTUOSO_LARGE = { image: 0, }, } as const -const BAIDU_ERNIE_4_5_VL_28B_A3B = { - id: 'baidu/ernie-4.5-vl-28b-a3b', - name: 'Baidu: ERNIE 4.5 VL 28B A3B', - supports: { - input: ['text', 'image'], - output: ['text'], - supports: [ - 'frequencyPenalty', - 'maxCompletionTokens', - 'presencePenalty', - 'reasoning', - 'seed', - 'stop', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 131072, - max_output_tokens: 8000, - pricing: { - text: { - input: { - normal: 0.14, - cached: 0, - }, - output: { - normal: 0.56, - }, - }, - image: 0, - }, -} as const const BAIDU_ERNIE_4_5_VL_424B_A47B = { id: 'baidu/ernie-4.5-vl-424b-a47b', name: 'Baidu: ERNIE 4.5 VL 424B A47B ', @@ -1683,7 +1648,7 @@ const DEEPSEEK_DEEPSEEK_CHAT_V3_0324 = { 'topP', ], }, - context_window: 163840, + context_window: 131072, max_output_tokens: 16384, pricing: { text: { @@ -2615,11 +2580,11 @@ const GOOGLE_GEMMA_3_12B_IT = { pricing: { text: { input: { - normal: 0.04, + normal: 0.05, cached: 0, }, output: { - normal: 0.13, + normal: 0.15, }, }, image: 0, @@ -2682,11 +2647,11 @@ const GOOGLE_GEMMA_3_4B_IT = { pricing: { text: { input: { - normal: 0.04, + normal: 0.05, cached: 0, }, output: { - normal: 0.08, + normal: 0.1, }, }, image: 0, @@ -2812,15 +2777,15 @@ const GOOGLE_GEMMA_4_31B_IT = { ], }, context_window: 262144, - max_output_tokens: 16384, + max_output_tokens: 8192, pricing: { text: { input: { normal: 0.12, - cached: 0, + cached: 0.09, }, output: { - normal: 0.37, + normal: 0.36, }, }, image: 0, @@ -3394,23 +3359,20 @@ const META_LLAMA_LLAMA_3_8B_INSTRUCT = { 'logitBias', 'maxCompletionTokens', 'presencePenalty', - 'responseFormat', - 'seed', 'stop', 'temperature', 'topP', ], }, context_window: 8192, - max_output_tokens: 8192, pricing: { text: { input: { - normal: 0.04, + normal: 0.14, cached: 0, }, output: { - normal: 0.04, + normal: 0.14, }, }, image: 0, @@ -3478,7 +3440,7 @@ const META_LLAMA_LLAMA_3_1_8B_INSTRUCT = { cached: 0, }, output: { - normal: 0.05, + normal: 0.03, }, }, image: 0, @@ -3507,11 +3469,11 @@ const META_LLAMA_LLAMA_3_2_11B_VISION_INSTRUCT = { pricing: { text: { input: { - normal: 0.245, + normal: 0.345, cached: 0, }, output: { - normal: 0.245, + normal: 0.345, }, }, image: 0, @@ -3732,7 +3694,7 @@ const META_LLAMA_LLAMA_4_SCOUT = { pricing: { text: { input: { - normal: 0.08, + normal: 0.1, cached: 0, }, output: { @@ -4084,10 +4046,10 @@ const MINIMAX_MINIMAX_M2_5 = { text: { input: { normal: 0.15, - cached: 0, + cached: 0.05, }, output: { - normal: 1.15, + normal: 0.9, }, }, image: 0, @@ -4120,11 +4082,11 @@ const MINIMAX_MINIMAX_M2_7 = { pricing: { text: { input: { - normal: 0.279, - cached: 0, + normal: 0.27, + cached: 0.054, }, output: { - normal: 1.2, + normal: 1.08, }, }, image: 0, @@ -4904,15 +4866,14 @@ const MOONSHOTAI_KIMI_K2_5 = { ], }, context_window: 262144, - max_output_tokens: 262144, pricing: { text: { input: { - normal: 0.4, - cached: 0.09, + normal: 0.35, + cached: 0, }, output: { - normal: 1.9, + normal: 1.89, }, }, image: 0, @@ -4942,37 +4903,15 @@ const MOONSHOTAI_KIMI_K2_6 = { ], }, context_window: 262144, - max_output_tokens: 262144, - pricing: { - text: { - input: { - normal: 0.684, - cached: 0.144, - }, - output: { - normal: 3.42, - }, - }, - image: 0, - }, -} as const -const MOONSHOTAI_KIMI_K2_6_FREE = { - id: 'moonshotai/kimi-k2.6:free', - name: 'MoonshotAI: Kimi K2.6 (free)', - supports: { - input: ['text', 'image'], - output: ['text'], - supports: ['reasoning', 'toolChoice'], - }, - context_window: 262144, + max_output_tokens: 262142, pricing: { text: { input: { - normal: 0, - cached: 0, + normal: 0.68, + cached: 0.34, }, output: { - normal: 0, + normal: 3.41, }, }, image: 0, @@ -5024,63 +4963,33 @@ const MORPH_MORPH_V3_LARGE = { image: 0, }, } as const -const NEX_AGI_DEEPSEEK_V3_1_NEX_N1 = { - id: 'nex-agi/deepseek-v3.1-nex-n1', - name: 'Nex AGI: DeepSeek V3.1 Nex N1', +const NEX_AGI_NEX_N2_PRO_FREE = { + id: 'nex-agi/nex-n2-pro:free', + name: 'Nex AGI: Nex-N2-Pro (free)', supports: { - input: ['text'], + input: ['text', 'image'], output: ['text'], supports: [ 'frequencyPenalty', + 'logprobs', 'maxCompletionTokens', + 'reasoning', 'responseFormat', 'temperature', 'toolChoice', 'topP', ], }, - context_window: 131072, - max_output_tokens: 163840, - pricing: { - text: { - input: { - normal: 0.135, - cached: 0, - }, - output: { - normal: 0.5, - }, - }, - image: 0, - }, -} as const -const NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B = { - id: 'nousresearch/hermes-2-pro-llama-3-8b', - name: 'NousResearch: Hermes 2 Pro - Llama-3 8B', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'frequencyPenalty', - 'maxCompletionTokens', - 'presencePenalty', - 'responseFormat', - 'seed', - 'stop', - 'temperature', - 'topP', - ], - }, - context_window: 8192, - max_output_tokens: 8192, + context_window: 262144, + max_output_tokens: 262144, pricing: { text: { input: { - normal: 0.14, + normal: 0, cached: 0, }, output: { - normal: 0.14, + normal: 0, }, }, image: 0, @@ -5171,11 +5080,11 @@ const NOUSRESEARCH_HERMES_3_LLAMA_3_1_70B = { pricing: { text: { input: { - normal: 0.3, + normal: 0.7, cached: 0, }, output: { - normal: 0.3, + normal: 0.7, }, }, image: 0, @@ -5266,7 +5175,7 @@ const NVIDIA_LLAMA_3_3_NEMOTRON_SUPER_49B_V1_5 = { pricing: { text: { input: { - normal: 0.1, + normal: 0.4, cached: 0, }, output: { @@ -5437,81 +5346,109 @@ const NVIDIA_NEMOTRON_3_SUPER_120B_A12B_FREE = { image: 0, }, } as const -const NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE = { - id: 'nvidia/nemotron-nano-12b-v2-vl:free', - name: 'NVIDIA: Nemotron Nano 12B 2 VL (free)', +const NVIDIA_NEMOTRON_3_ULTRA_550B_A55B = { + id: 'nvidia/nemotron-3-ultra-550b-a55b', + name: 'NVIDIA: Nemotron 3 Ultra', supports: { - input: ['image', 'text', 'video'], + input: ['text'], output: ['text'], supports: [ + 'frequencyPenalty', + 'logitBias', 'maxCompletionTokens', + 'presencePenalty', 'reasoning', + 'responseFormat', 'seed', + 'stop', 'temperature', 'toolChoice', 'topP', ], }, - context_window: 128000, - max_output_tokens: 128000, + context_window: 1000000, + max_output_tokens: 16384, pricing: { text: { input: { - normal: 0, - cached: 0, + normal: 0.5, + cached: 0.15, }, output: { - normal: 0, + normal: 2.5, }, }, image: 0, }, } as const -const NVIDIA_NEMOTRON_NANO_9B_V2 = { - id: 'nvidia/nemotron-nano-9b-v2', - name: 'NVIDIA: Nemotron Nano 9B V2', +const NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE = { + id: 'nvidia/nemotron-3-ultra-550b-a55b:free', + name: 'NVIDIA: Nemotron 3 Ultra (free)', supports: { input: ['text'], output: ['text'], supports: [ - 'frequencyPenalty', - 'logitBias', 'maxCompletionTokens', - 'presencePenalty', 'reasoning', - 'responseFormat', 'seed', - 'stop', 'temperature', 'toolChoice', 'topP', ], }, - context_window: 131072, - max_output_tokens: 16384, + context_window: 1000000, + max_output_tokens: 65536, pricing: { text: { input: { - normal: 0.04, + normal: 0, cached: 0, }, output: { - normal: 0.16, + normal: 0, }, }, image: 0, }, } as const -const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = { - id: 'nvidia/nemotron-nano-9b-v2:free', - name: 'NVIDIA: Nemotron Nano 9B V2 (free)', +const NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE = { + id: 'nvidia/nemotron-3.5-content-safety:free', + name: 'NVIDIA: Nemotron 3.5 Content Safety (free)', supports: { - input: ['text'], + input: ['text', 'image'], + output: ['text'], + supports: [ + 'maxCompletionTokens', + 'reasoning', + 'seed', + 'temperature', + 'topP', + ], + }, + context_window: 128000, + max_output_tokens: 8192, + pricing: { + text: { + input: { + normal: 0, + cached: 0, + }, + output: { + normal: 0, + }, + }, + image: 0, + }, +} as const +const NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE = { + id: 'nvidia/nemotron-nano-12b-v2-vl:free', + name: 'NVIDIA: Nemotron Nano 12B 2 VL (free)', + supports: { + input: ['image', 'text', 'video'], output: ['text'], supports: [ 'maxCompletionTokens', 'reasoning', - 'responseFormat', 'seed', 'temperature', 'toolChoice', @@ -5519,6 +5456,7 @@ const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = { ], }, context_window: 128000, + max_output_tokens: 128000, pricing: { text: { input: { @@ -5532,81 +5470,74 @@ const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = { image: 0, }, } as const -const OPENAI_GPT_3_5_TURBO = { - id: 'openai/gpt-3.5-turbo', - name: 'OpenAI: GPT-3.5 Turbo', +const NVIDIA_NEMOTRON_NANO_9B_V2 = { + id: 'nvidia/nemotron-nano-9b-v2', + name: 'NVIDIA: Nemotron Nano 9B V2', supports: { input: ['text'], output: ['text'], supports: [ 'frequencyPenalty', 'logitBias', - 'logprobs', 'maxCompletionTokens', 'presencePenalty', + 'reasoning', 'responseFormat', 'seed', 'stop', 'temperature', 'toolChoice', - 'topLogprobs', 'topP', ], }, - context_window: 16385, - max_output_tokens: 4096, + context_window: 131072, + max_output_tokens: 16384, pricing: { text: { input: { - normal: 0.5, + normal: 0.04, cached: 0, }, output: { - normal: 1.5, + normal: 0.16, }, }, image: 0, }, } as const -const OPENAI_GPT_3_5_TURBO_0613 = { - id: 'openai/gpt-3.5-turbo-0613', - name: 'OpenAI: GPT-3.5 Turbo (older v0613)', +const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = { + id: 'nvidia/nemotron-nano-9b-v2:free', + name: 'NVIDIA: Nemotron Nano 9B V2 (free)', supports: { input: ['text'], output: ['text'], supports: [ - 'frequencyPenalty', - 'logitBias', - 'logprobs', 'maxCompletionTokens', - 'presencePenalty', + 'reasoning', 'responseFormat', 'seed', - 'stop', 'temperature', 'toolChoice', - 'topLogprobs', 'topP', ], }, - context_window: 4095, - max_output_tokens: 4096, + context_window: 128000, pricing: { text: { input: { - normal: 1, + normal: 0, cached: 0, }, output: { - normal: 2, + normal: 0, }, }, image: 0, }, } as const -const OPENAI_GPT_3_5_TURBO_16K = { - id: 'openai/gpt-3.5-turbo-16k', - name: 'OpenAI: GPT-3.5 Turbo 16k', +const OPENAI_GPT_3_5_TURBO = { + id: 'openai/gpt-3.5-turbo', + name: 'OpenAI: GPT-3.5 Turbo', supports: { input: ['text'], output: ['text'], @@ -5615,7 +5546,6 @@ const OPENAI_GPT_3_5_TURBO_16K = { 'logitBias', 'logprobs', 'maxCompletionTokens', - 'maxCompletionTokens', 'presencePenalty', 'responseFormat', 'seed', @@ -5631,19 +5561,19 @@ const OPENAI_GPT_3_5_TURBO_16K = { pricing: { text: { input: { - normal: 3, + normal: 0.5, cached: 0, }, output: { - normal: 4, + normal: 1.5, }, }, image: 0, }, } as const -const OPENAI_GPT_3_5_TURBO_INSTRUCT = { - id: 'openai/gpt-3.5-turbo-instruct', - name: 'OpenAI: GPT-3.5 Turbo Instruct', +const OPENAI_GPT_3_5_TURBO_0613 = { + id: 'openai/gpt-3.5-turbo-0613', + name: 'OpenAI: GPT-3.5 Turbo (older v0613)', supports: { input: ['text'], output: ['text'], @@ -5657,6 +5587,7 @@ const OPENAI_GPT_3_5_TURBO_INSTRUCT = { 'seed', 'stop', 'temperature', + 'toolChoice', 'topLogprobs', 'topP', ], @@ -5666,7 +5597,7 @@ const OPENAI_GPT_3_5_TURBO_INSTRUCT = { pricing: { text: { input: { - normal: 1.5, + normal: 1, cached: 0, }, output: { @@ -5676,9 +5607,9 @@ const OPENAI_GPT_3_5_TURBO_INSTRUCT = { image: 0, }, } as const -const OPENAI_GPT_4 = { - id: 'openai/gpt-4', - name: 'OpenAI: GPT-4', +const OPENAI_GPT_3_5_TURBO_16K = { + id: 'openai/gpt-3.5-turbo-16k', + name: 'OpenAI: GPT-3.5 Turbo 16k', supports: { input: ['text'], output: ['text'], @@ -5698,24 +5629,24 @@ const OPENAI_GPT_4 = { 'topP', ], }, - context_window: 8191, + context_window: 16385, max_output_tokens: 4096, pricing: { text: { input: { - normal: 30, + normal: 3, cached: 0, }, output: { - normal: 60, + normal: 4, }, }, image: 0, }, } as const -const OPENAI_GPT_4_0314 = { - id: 'openai/gpt-4-0314', - name: 'OpenAI: GPT-4 (older v0314)', +const OPENAI_GPT_3_5_TURBO_INSTRUCT = { + id: 'openai/gpt-3.5-turbo-instruct', + name: 'OpenAI: GPT-3.5 Turbo Instruct', supports: { input: ['text'], output: ['text'], @@ -5729,29 +5660,28 @@ const OPENAI_GPT_4_0314 = { 'seed', 'stop', 'temperature', - 'toolChoice', 'topLogprobs', 'topP', ], }, - context_window: 8191, + context_window: 4095, max_output_tokens: 4096, pricing: { text: { input: { - normal: 30, + normal: 1.5, cached: 0, }, output: { - normal: 60, + normal: 2, }, }, image: 0, }, } as const -const OPENAI_GPT_4_1106_PREVIEW = { - id: 'openai/gpt-4-1106-preview', - name: 'OpenAI: GPT-4 Turbo (older v1106)', +const OPENAI_GPT_4 = { + id: 'openai/gpt-4', + name: 'OpenAI: GPT-4', supports: { input: ['text'], output: ['text'], @@ -5760,6 +5690,7 @@ const OPENAI_GPT_4_1106_PREVIEW = { 'logitBias', 'logprobs', 'maxCompletionTokens', + 'maxCompletionTokens', 'presencePenalty', 'responseFormat', 'seed', @@ -5770,16 +5701,16 @@ const OPENAI_GPT_4_1106_PREVIEW = { 'topP', ], }, - context_window: 128000, + context_window: 8191, max_output_tokens: 4096, pricing: { text: { input: { - normal: 10, + normal: 30, cached: 0, }, output: { - normal: 30, + normal: 60, }, }, image: 0, @@ -8169,7 +8100,7 @@ const QWEN_QWEN3_235B_A22B_2507 = { pricing: { text: { input: { - normal: 0.071, + normal: 0.09, cached: 0, }, output: { @@ -8237,15 +8168,15 @@ const QWEN_QWEN3_30B_A3B = { ], }, context_window: 131072, - max_output_tokens: 20000, + max_output_tokens: 16384, pricing: { text: { input: { - normal: 0.09, + normal: 0.12, cached: 0, }, output: { - normal: 0.45, + normal: 0.5, }, }, image: 0, @@ -8275,11 +8206,11 @@ const QWEN_QWEN3_30B_A3B_INSTRUCT_2507 = { pricing: { text: { input: { - normal: 0.0428, + normal: 0.04815, cached: 0, }, output: { - normal: 0.1716, + normal: 0.19305, }, }, image: 0, @@ -9151,11 +9082,11 @@ const QWEN_QWEN3_5_9B = { ], }, context_window: 262144, - max_output_tokens: 81920, + max_output_tokens: 262144, pricing: { text: { input: { - normal: 0.04, + normal: 0.1, cached: 0, }, output: { @@ -9284,15 +9215,15 @@ const QWEN_QWEN3_6_27B = { ], }, context_window: 262144, - max_output_tokens: 262140, + max_output_tokens: 131072, pricing: { text: { input: { - normal: 0.29, + normal: 0.289, cached: 0, }, output: { - normal: 3.2, + normal: 2.4, }, }, image: 0, @@ -9321,12 +9252,12 @@ const QWEN_QWEN3_6_35B_A3B = { ], }, context_window: 262144, - max_output_tokens: 262140, + max_output_tokens: 262144, pricing: { text: { input: { - normal: 0.14, - cached: 0, + normal: 0.15, + cached: 0.05, }, output: { normal: 1, @@ -9467,6 +9398,40 @@ const QWEN_QWEN3_7_MAX = { image: 0, }, } as const +const QWEN_QWEN3_7_PLUS = { + id: 'qwen/qwen3.7-plus', + name: 'Qwen: Qwen3.7 Plus', + supports: { + input: ['text', 'image'], + output: ['text'], + supports: [ + 'logprobs', + 'maxCompletionTokens', + 'presencePenalty', + 'reasoning', + 'responseFormat', + 'seed', + 'temperature', + 'toolChoice', + 'topLogprobs', + 'topP', + ], + }, + context_window: 1000000, + max_output_tokens: 65536, + pricing: { + text: { + input: { + normal: 0.4, + cached: 0.58, + }, + output: { + normal: 1.6, + }, + }, + image: 0, + }, +} as const const REKAAI_REKA_EDGE = { id: 'rekaai/reka-edge', name: 'Reka Edge', @@ -9584,38 +9549,6 @@ const RELACE_RELACE_SEARCH = { image: 0, }, } as const -const SAO10K_L3_EURYALE_70B = { - id: 'sao10k/l3-euryale-70b', - name: 'Sao10k: Llama 3 Euryale 70B v2.1', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'frequencyPenalty', - 'maxCompletionTokens', - 'presencePenalty', - 'seed', - 'stop', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 8192, - max_output_tokens: 8192, - pricing: { - text: { - input: { - normal: 1.48, - cached: 0, - }, - output: { - normal: 1.48, - }, - }, - image: 0, - }, -} as const const SAO10K_L3_LUNARIS_8B = { id: 'sao10k/l3-lunaris-8b', name: 'Sao10K: Llama 3 8B Lunaris', @@ -10273,7 +10206,6 @@ const XIAOMI_MIMO_V2_FLASH = { 'presencePenalty', 'reasoning', 'responseFormat', - 'seed', 'stop', 'temperature', 'toolChoice', @@ -10363,28 +10295,6 @@ const XIAOMI_MIMO_V2_5_PRO = { image: 0, }, } as const -const Z_AI_GLM_4_32B = { - id: 'z-ai/glm-4-32b', - name: 'Z.ai: GLM 4 32B ', - supports: { - input: ['text'], - output: ['text'], - supports: ['maxCompletionTokens', 'temperature', 'toolChoice', 'topP'], - }, - context_window: 128000, - pricing: { - text: { - input: { - normal: 0.1, - cached: 0, - }, - output: { - normal: 0.1, - }, - }, - image: 0, - }, -} as const const Z_AI_GLM_4_5 = { id: 'z-ai/glm-4.5', name: 'Z.ai: GLM 4.5', @@ -10427,6 +10337,7 @@ const Z_AI_GLM_4_5_AIR = { output: ['text'], supports: [ 'frequencyPenalty', + 'logprobs', 'maxCompletionTokens', 'presencePenalty', 'reasoning', @@ -10435,6 +10346,7 @@ const Z_AI_GLM_4_5_AIR = { 'stop', 'temperature', 'toolChoice', + 'topLogprobs', 'topP', ], }, @@ -10453,35 +10365,6 @@ const Z_AI_GLM_4_5_AIR = { image: 0, }, } as const -const Z_AI_GLM_4_5_AIR_FREE = { - id: 'z-ai/glm-4.5-air:free', - name: 'Z.ai: GLM 4.5 Air (free)', - supports: { - input: ['text'], - output: ['text'], - supports: [ - 'maxCompletionTokens', - 'reasoning', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 131072, - max_output_tokens: 96000, - pricing: { - text: { - input: { - normal: 0, - cached: 0, - }, - output: { - normal: 0, - }, - }, - image: 0, - }, -} as const const Z_AI_GLM_4_5V = { id: 'z-ai/glm-4.5v', name: 'Z.ai: GLM 4.5V', @@ -10571,12 +10454,12 @@ const Z_AI_GLM_4_6V = { ], }, context_window: 131072, - max_output_tokens: 24000, + max_output_tokens: 32768, pricing: { text: { input: { normal: 0.3, - cached: 0.05, + cached: 0.055, }, output: { normal: 0.9, @@ -10711,7 +10594,7 @@ const Z_AI_GLM_5_TURBO = { 'topP', ], }, - context_window: 202752, + context_window: 262144, max_output_tokens: 131072, pricing: { text: { @@ -10763,38 +10646,18 @@ const Z_AI_GLM_5_1 = { image: 0, }, } as const -const Z_AI_GLM_5V_TURBO = { - id: 'z-ai/glm-5v-turbo', - name: 'Z.ai: GLM 5V Turbo', - supports: { - input: ['image', 'text', 'video'], - output: ['text'], - supports: [ - 'maxCompletionTokens', - 'reasoning', - 'responseFormat', - 'temperature', - 'toolChoice', - 'topP', - ], - }, - context_window: 202752, - max_output_tokens: 131072, - pricing: { - text: { - input: { - normal: 1.2, - cached: 0.24, - }, - output: { - normal: 4, - }, - }, - image: 0, - }, -} as const export type OpenRouterModelOptionsByName = { + [_ANTHROPIC_CLAUDE_FABLE_LATEST.id]: OpenRouterCommonOptions & + Pick< + OpenRouterBaseOptions, + | 'maxCompletionTokens' + | 'maxCompletionTokens' + | 'reasoning' + | 'responseFormat' + | 'stop' + | 'toolChoice' + > [_ANTHROPIC_CLAUDE_HAIKU_LATEST.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -10985,6 +10848,16 @@ export type OpenRouterModelOptionsByName = { OpenRouterBaseOptions, 'maxCompletionTokens' | 'stop' | 'temperature' | 'toolChoice' | 'topP' > + [ANTHROPIC_CLAUDE_FABLE_5.id]: OpenRouterCommonOptions & + Pick< + OpenRouterBaseOptions, + | 'maxCompletionTokens' + | 'maxCompletionTokens' + | 'reasoning' + | 'responseFormat' + | 'stop' + | 'toolChoice' + > [ANTHROPIC_CLAUDE_HAIKU_4_5.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -11130,28 +11003,6 @@ export type OpenRouterModelOptionsByName = { | 'temperature' | 'topP' > - [ARCEE_AI_MAESTRO_REASONING.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'logitBias' - | 'maxCompletionTokens' - | 'presencePenalty' - | 'stop' - | 'temperature' - | 'topP' - > - [ARCEE_AI_SPOTLIGHT.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'logitBias' - | 'maxCompletionTokens' - | 'presencePenalty' - | 'stop' - | 'temperature' - | 'topP' - > [ARCEE_AI_TRINITY_LARGE_THINKING.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -11191,19 +11042,6 @@ export type OpenRouterModelOptionsByName = { | 'toolChoice' | 'topP' > - [BAIDU_ERNIE_4_5_VL_28B_A3B.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'maxCompletionTokens' - | 'presencePenalty' - | 'reasoning' - | 'seed' - | 'stop' - | 'temperature' - | 'toolChoice' - | 'topP' - > [BAIDU_ERNIE_4_5_VL_424B_A47B.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -12032,8 +11870,6 @@ export type OpenRouterModelOptionsByName = { | 'logitBias' | 'maxCompletionTokens' | 'presencePenalty' - | 'responseFormat' - | 'seed' | 'stop' | 'temperature' | 'topP' @@ -12654,34 +12490,22 @@ export type OpenRouterModelOptionsByName = { | 'topLogprobs' | 'topP' > - [MOONSHOTAI_KIMI_K2_6_FREE.id]: OpenRouterCommonOptions & - Pick [MORPH_MORPH_V3_FAST.id]: OpenRouterCommonOptions & Pick [MORPH_MORPH_V3_LARGE.id]: OpenRouterCommonOptions & Pick - [NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id]: OpenRouterCommonOptions & + [NEX_AGI_NEX_N2_PRO_FREE.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' + | 'logprobs' | 'maxCompletionTokens' + | 'reasoning' | 'responseFormat' | 'temperature' | 'toolChoice' | 'topP' > - [NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'maxCompletionTokens' - | 'presencePenalty' - | 'responseFormat' - | 'seed' - | 'stop' - | 'temperature' - | 'topP' - > [NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -12818,82 +12642,79 @@ export type OpenRouterModelOptionsByName = { | 'toolChoice' | 'topP' > - [NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id]: OpenRouterCommonOptions & + [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, + | 'frequencyPenalty' + | 'logitBias' | 'maxCompletionTokens' + | 'presencePenalty' | 'reasoning' + | 'responseFormat' | 'seed' + | 'stop' | 'temperature' | 'toolChoice' | 'topP' > - [NVIDIA_NEMOTRON_NANO_9B_V2.id]: OpenRouterCommonOptions & + [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'logitBias' | 'maxCompletionTokens' - | 'presencePenalty' | 'reasoning' - | 'responseFormat' | 'seed' - | 'stop' | 'temperature' | 'toolChoice' | 'topP' > - [NVIDIA_NEMOTRON_NANO_9B_V2_FREE.id]: OpenRouterCommonOptions & + [NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE.id]: OpenRouterCommonOptions & + Pick< + OpenRouterBaseOptions, + 'maxCompletionTokens' | 'reasoning' | 'seed' | 'temperature' | 'topP' + > + [NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'maxCompletionTokens' | 'reasoning' - | 'responseFormat' | 'seed' | 'temperature' | 'toolChoice' | 'topP' > - [OPENAI_GPT_3_5_TURBO.id]: OpenRouterCommonOptions & + [NVIDIA_NEMOTRON_NANO_9B_V2.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' | 'logitBias' - | 'logprobs' | 'maxCompletionTokens' | 'presencePenalty' + | 'reasoning' | 'responseFormat' | 'seed' | 'stop' | 'temperature' | 'toolChoice' - | 'topLogprobs' | 'topP' > - [OPENAI_GPT_3_5_TURBO_0613.id]: OpenRouterCommonOptions & + [NVIDIA_NEMOTRON_NANO_9B_V2_FREE.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, - | 'frequencyPenalty' - | 'logitBias' - | 'logprobs' | 'maxCompletionTokens' - | 'presencePenalty' + | 'reasoning' | 'responseFormat' | 'seed' - | 'stop' | 'temperature' | 'toolChoice' - | 'topLogprobs' | 'topP' > - [OPENAI_GPT_3_5_TURBO_16K.id]: OpenRouterCommonOptions & + [OPENAI_GPT_3_5_TURBO.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' | 'logitBias' | 'logprobs' | 'maxCompletionTokens' - | 'maxCompletionTokens' | 'presencePenalty' | 'responseFormat' | 'seed' @@ -12903,7 +12724,7 @@ export type OpenRouterModelOptionsByName = { | 'topLogprobs' | 'topP' > - [OPENAI_GPT_3_5_TURBO_INSTRUCT.id]: OpenRouterCommonOptions & + [OPENAI_GPT_3_5_TURBO_0613.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' @@ -12915,10 +12736,11 @@ export type OpenRouterModelOptionsByName = { | 'seed' | 'stop' | 'temperature' + | 'toolChoice' | 'topLogprobs' | 'topP' > - [OPENAI_GPT_4.id]: OpenRouterCommonOptions & + [OPENAI_GPT_3_5_TURBO_16K.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' @@ -12935,7 +12757,7 @@ export type OpenRouterModelOptionsByName = { | 'topLogprobs' | 'topP' > - [OPENAI_GPT_4_0314.id]: OpenRouterCommonOptions & + [OPENAI_GPT_3_5_TURBO_INSTRUCT.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' @@ -12947,17 +12769,17 @@ export type OpenRouterModelOptionsByName = { | 'seed' | 'stop' | 'temperature' - | 'toolChoice' | 'topLogprobs' | 'topP' > - [OPENAI_GPT_4_1106_PREVIEW.id]: OpenRouterCommonOptions & + [OPENAI_GPT_4.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' | 'logitBias' | 'logprobs' | 'maxCompletionTokens' + | 'maxCompletionTokens' | 'presencePenalty' | 'responseFormat' | 'seed' @@ -14364,48 +14186,50 @@ export type OpenRouterModelOptionsByName = { | 'topLogprobs' | 'topP' > - [REKAAI_REKA_EDGE.id]: OpenRouterCommonOptions & + [QWEN_QWEN3_7_PLUS.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, - | 'frequencyPenalty' + | 'logprobs' | 'maxCompletionTokens' | 'presencePenalty' + | 'reasoning' + | 'responseFormat' | 'seed' - | 'stop' | 'temperature' | 'toolChoice' + | 'topLogprobs' | 'topP' > - [REKAAI_REKA_FLASH_3.id]: OpenRouterCommonOptions & + [REKAAI_REKA_EDGE.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, | 'frequencyPenalty' | 'maxCompletionTokens' | 'presencePenalty' - | 'reasoning' | 'seed' | 'stop' | 'temperature' + | 'toolChoice' | 'topP' > - [RELACE_RELACE_APPLY_3.id]: OpenRouterCommonOptions & - Pick - [RELACE_RELACE_SEARCH.id]: OpenRouterCommonOptions & + [REKAAI_REKA_FLASH_3.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, + | 'frequencyPenalty' | 'maxCompletionTokens' + | 'presencePenalty' + | 'reasoning' | 'seed' | 'stop' | 'temperature' - | 'toolChoice' | 'topP' > - [SAO10K_L3_EURYALE_70B.id]: OpenRouterCommonOptions & + [RELACE_RELACE_APPLY_3.id]: OpenRouterCommonOptions & + Pick + [RELACE_RELACE_SEARCH.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, - | 'frequencyPenalty' | 'maxCompletionTokens' - | 'presencePenalty' | 'seed' | 'stop' | 'temperature' @@ -14675,7 +14499,6 @@ export type OpenRouterModelOptionsByName = { | 'presencePenalty' | 'reasoning' | 'responseFormat' - | 'seed' | 'stop' | 'temperature' | 'toolChoice' @@ -14709,11 +14532,6 @@ export type OpenRouterModelOptionsByName = { | 'toolChoice' | 'topP' > - [Z_AI_GLM_4_32B.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - 'maxCompletionTokens' | 'temperature' | 'toolChoice' | 'topP' - > [Z_AI_GLM_4_5.id]: OpenRouterCommonOptions & Pick< OpenRouterBaseOptions, @@ -14732,6 +14550,7 @@ export type OpenRouterModelOptionsByName = { Pick< OpenRouterBaseOptions, | 'frequencyPenalty' + | 'logprobs' | 'maxCompletionTokens' | 'presencePenalty' | 'reasoning' @@ -14740,15 +14559,7 @@ export type OpenRouterModelOptionsByName = { | 'stop' | 'temperature' | 'toolChoice' - | 'topP' - > - [Z_AI_GLM_4_5_AIR_FREE.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'maxCompletionTokens' - | 'reasoning' - | 'temperature' - | 'toolChoice' + | 'topLogprobs' | 'topP' > [Z_AI_GLM_4_5V.id]: OpenRouterCommonOptions & @@ -14874,20 +14685,13 @@ export type OpenRouterModelOptionsByName = { | 'topLogprobs' | 'topP' > - [Z_AI_GLM_5V_TURBO.id]: OpenRouterCommonOptions & - Pick< - OpenRouterBaseOptions, - | 'maxCompletionTokens' - | 'reasoning' - | 'responseFormat' - | 'temperature' - | 'toolChoice' - | 'topP' - > 'openrouter/auto': OpenRouterCommonOptions & OpenRouterBaseOptions } export type OpenRouterModelInputModalitiesByName = { + [_ANTHROPIC_CLAUDE_FABLE_LATEST.id]: ReadonlyArray< + 'text' | 'image' | 'document' + > [_ANTHROPIC_CLAUDE_HAIKU_LATEST.id]: ReadonlyArray< 'text' | 'image' | 'document' > @@ -14922,6 +14726,7 @@ export type OpenRouterModelInputModalitiesByName = { [ANTHRACITE_ORG_MAGNUM_V4_72B.id]: ReadonlyArray<'text'> [ANTHROPIC_CLAUDE_3_HAIKU.id]: ReadonlyArray<'text' | 'image'> [ANTHROPIC_CLAUDE_3_5_HAIKU.id]: ReadonlyArray<'text' | 'image'> + [ANTHROPIC_CLAUDE_FABLE_5.id]: ReadonlyArray<'text' | 'image' | 'document'> [ANTHROPIC_CLAUDE_HAIKU_4_5.id]: ReadonlyArray<'text' | 'image' | 'document'> [ANTHROPIC_CLAUDE_OPUS_4.id]: ReadonlyArray<'image' | 'text' | 'document'> [ANTHROPIC_CLAUDE_OPUS_4_1.id]: ReadonlyArray<'image' | 'text' | 'document'> @@ -14942,12 +14747,9 @@ export type OpenRouterModelInputModalitiesByName = { [ANTHROPIC_CLAUDE_SONNET_4_5.id]: ReadonlyArray<'text' | 'image' | 'document'> [ANTHROPIC_CLAUDE_SONNET_4_6.id]: ReadonlyArray<'text' | 'image' | 'document'> [ARCEE_AI_CODER_LARGE.id]: ReadonlyArray<'text'> - [ARCEE_AI_MAESTRO_REASONING.id]: ReadonlyArray<'text'> - [ARCEE_AI_SPOTLIGHT.id]: ReadonlyArray<'image' | 'text'> [ARCEE_AI_TRINITY_LARGE_THINKING.id]: ReadonlyArray<'text'> [ARCEE_AI_TRINITY_MINI.id]: ReadonlyArray<'text'> [ARCEE_AI_VIRTUOSO_LARGE.id]: ReadonlyArray<'text'> - [BAIDU_ERNIE_4_5_VL_28B_A3B.id]: ReadonlyArray<'text' | 'image'> [BAIDU_ERNIE_4_5_VL_424B_A47B.id]: ReadonlyArray<'image' | 'text'> [BYTEDANCE_SEED_SEED_1_6.id]: ReadonlyArray<'image' | 'text' | 'video'> [BYTEDANCE_SEED_SEED_1_6_FLASH.id]: ReadonlyArray<'image' | 'text' | 'video'> @@ -15094,11 +14896,9 @@ export type OpenRouterModelInputModalitiesByName = { [MOONSHOTAI_KIMI_K2_THINKING.id]: ReadonlyArray<'text'> [MOONSHOTAI_KIMI_K2_5.id]: ReadonlyArray<'text' | 'image'> [MOONSHOTAI_KIMI_K2_6.id]: ReadonlyArray<'text' | 'image'> - [MOONSHOTAI_KIMI_K2_6_FREE.id]: ReadonlyArray<'text' | 'image'> [MORPH_MORPH_V3_FAST.id]: ReadonlyArray<'text'> [MORPH_MORPH_V3_LARGE.id]: ReadonlyArray<'text'> - [NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id]: ReadonlyArray<'text'> - [NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B.id]: ReadonlyArray<'text'> + [NEX_AGI_NEX_N2_PRO_FREE.id]: ReadonlyArray<'text' | 'image'> [NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B.id]: ReadonlyArray<'text'> [NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B_FREE.id]: ReadonlyArray<'text'> [NOUSRESEARCH_HERMES_3_LLAMA_3_1_70B.id]: ReadonlyArray<'text'> @@ -15112,6 +14912,9 @@ export type OpenRouterModelInputModalitiesByName = { > [NVIDIA_NEMOTRON_3_SUPER_120B_A12B.id]: ReadonlyArray<'text'> [NVIDIA_NEMOTRON_3_SUPER_120B_A12B_FREE.id]: ReadonlyArray<'text'> + [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B.id]: ReadonlyArray<'text'> + [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE.id]: ReadonlyArray<'text'> + [NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE.id]: ReadonlyArray<'text' | 'image'> [NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id]: ReadonlyArray< 'image' | 'text' | 'video' > @@ -15122,8 +14925,6 @@ export type OpenRouterModelInputModalitiesByName = { [OPENAI_GPT_3_5_TURBO_16K.id]: ReadonlyArray<'text'> [OPENAI_GPT_3_5_TURBO_INSTRUCT.id]: ReadonlyArray<'text'> [OPENAI_GPT_4.id]: ReadonlyArray<'text'> - [OPENAI_GPT_4_0314.id]: ReadonlyArray<'text'> - [OPENAI_GPT_4_1106_PREVIEW.id]: ReadonlyArray<'text'> [OPENAI_GPT_4_TURBO.id]: ReadonlyArray<'text' | 'image'> [OPENAI_GPT_4_TURBO_PREVIEW.id]: ReadonlyArray<'text'> [OPENAI_GPT_4_1.id]: ReadonlyArray<'image' | 'text' | 'document'> @@ -15243,11 +15044,11 @@ export type OpenRouterModelInputModalitiesByName = { [QWEN_QWEN3_6_MAX_PREVIEW.id]: ReadonlyArray<'text'> [QWEN_QWEN3_6_PLUS.id]: ReadonlyArray<'text' | 'image' | 'video'> [QWEN_QWEN3_7_MAX.id]: ReadonlyArray<'text'> + [QWEN_QWEN3_7_PLUS.id]: ReadonlyArray<'text' | 'image'> [REKAAI_REKA_EDGE.id]: ReadonlyArray<'image' | 'text' | 'video'> [REKAAI_REKA_FLASH_3.id]: ReadonlyArray<'text'> [RELACE_RELACE_APPLY_3.id]: ReadonlyArray<'text'> [RELACE_RELACE_SEARCH.id]: ReadonlyArray<'text'> - [SAO10K_L3_EURYALE_70B.id]: ReadonlyArray<'text'> [SAO10K_L3_LUNARIS_8B.id]: ReadonlyArray<'text'> [SAO10K_L3_1_70B_HANAMI_X1.id]: ReadonlyArray<'text'> [SAO10K_L3_1_EURYALE_70B.id]: ReadonlyArray<'text'> @@ -15271,10 +15072,8 @@ export type OpenRouterModelInputModalitiesByName = { [XIAOMI_MIMO_V2_FLASH.id]: ReadonlyArray<'text'> [XIAOMI_MIMO_V2_5.id]: ReadonlyArray<'text' | 'audio' | 'image' | 'video'> [XIAOMI_MIMO_V2_5_PRO.id]: ReadonlyArray<'text'> - [Z_AI_GLM_4_32B.id]: ReadonlyArray<'text'> [Z_AI_GLM_4_5.id]: ReadonlyArray<'text'> [Z_AI_GLM_4_5_AIR.id]: ReadonlyArray<'text'> - [Z_AI_GLM_4_5_AIR_FREE.id]: ReadonlyArray<'text'> [Z_AI_GLM_4_5V.id]: ReadonlyArray<'text' | 'image'> [Z_AI_GLM_4_6.id]: ReadonlyArray<'text'> [Z_AI_GLM_4_6V.id]: ReadonlyArray<'image' | 'text' | 'video'> @@ -15283,13 +15082,13 @@ export type OpenRouterModelInputModalitiesByName = { [Z_AI_GLM_5.id]: ReadonlyArray<'text'> [Z_AI_GLM_5_TURBO.id]: ReadonlyArray<'text'> [Z_AI_GLM_5_1.id]: ReadonlyArray<'text'> - [Z_AI_GLM_5V_TURBO.id]: ReadonlyArray<'image' | 'text' | 'video'> 'openrouter/auto': ReadonlyArray< 'text' | 'image' | 'audio' | 'video' | 'document' > } export const OPENROUTER_CHAT_MODELS = [ + _ANTHROPIC_CLAUDE_FABLE_LATEST.id, _ANTHROPIC_CLAUDE_HAIKU_LATEST.id, _ANTHROPIC_CLAUDE_OPUS_LATEST.id, _ANTHROPIC_CLAUDE_SONNET_LATEST.id, @@ -15312,6 +15111,7 @@ export const OPENROUTER_CHAT_MODELS = [ ANTHRACITE_ORG_MAGNUM_V4_72B.id, ANTHROPIC_CLAUDE_3_HAIKU.id, ANTHROPIC_CLAUDE_3_5_HAIKU.id, + ANTHROPIC_CLAUDE_FABLE_5.id, ANTHROPIC_CLAUDE_HAIKU_4_5.id, ANTHROPIC_CLAUDE_OPUS_4.id, ANTHROPIC_CLAUDE_OPUS_4_1.id, @@ -15326,12 +15126,9 @@ export const OPENROUTER_CHAT_MODELS = [ ANTHROPIC_CLAUDE_SONNET_4_5.id, ANTHROPIC_CLAUDE_SONNET_4_6.id, ARCEE_AI_CODER_LARGE.id, - ARCEE_AI_MAESTRO_REASONING.id, - ARCEE_AI_SPOTLIGHT.id, ARCEE_AI_TRINITY_LARGE_THINKING.id, ARCEE_AI_TRINITY_MINI.id, ARCEE_AI_VIRTUOSO_LARGE.id, - BAIDU_ERNIE_4_5_VL_28B_A3B.id, BAIDU_ERNIE_4_5_VL_424B_A47B.id, BYTEDANCE_SEED_SEED_1_6.id, BYTEDANCE_SEED_SEED_1_6_FLASH.id, @@ -15444,11 +15241,9 @@ export const OPENROUTER_CHAT_MODELS = [ MOONSHOTAI_KIMI_K2_THINKING.id, MOONSHOTAI_KIMI_K2_5.id, MOONSHOTAI_KIMI_K2_6.id, - MOONSHOTAI_KIMI_K2_6_FREE.id, MORPH_MORPH_V3_FAST.id, MORPH_MORPH_V3_LARGE.id, - NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id, - NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B.id, + NEX_AGI_NEX_N2_PRO_FREE.id, NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B.id, NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B_FREE.id, NOUSRESEARCH_HERMES_3_LLAMA_3_1_70B.id, @@ -15460,6 +15255,9 @@ export const OPENROUTER_CHAT_MODELS = [ NVIDIA_NEMOTRON_3_NANO_OMNI_30B_A3B_REASONING_FREE.id, NVIDIA_NEMOTRON_3_SUPER_120B_A12B.id, NVIDIA_NEMOTRON_3_SUPER_120B_A12B_FREE.id, + NVIDIA_NEMOTRON_3_ULTRA_550B_A55B.id, + NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE.id, + NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE.id, NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id, NVIDIA_NEMOTRON_NANO_9B_V2.id, NVIDIA_NEMOTRON_NANO_9B_V2_FREE.id, @@ -15468,8 +15266,6 @@ export const OPENROUTER_CHAT_MODELS = [ OPENAI_GPT_3_5_TURBO_16K.id, OPENAI_GPT_3_5_TURBO_INSTRUCT.id, OPENAI_GPT_4.id, - OPENAI_GPT_4_0314.id, - OPENAI_GPT_4_1106_PREVIEW.id, OPENAI_GPT_4_TURBO.id, OPENAI_GPT_4_TURBO_PREVIEW.id, OPENAI_GPT_4_1.id, @@ -15585,11 +15381,11 @@ export const OPENROUTER_CHAT_MODELS = [ QWEN_QWEN3_6_MAX_PREVIEW.id, QWEN_QWEN3_6_PLUS.id, QWEN_QWEN3_7_MAX.id, + QWEN_QWEN3_7_PLUS.id, REKAAI_REKA_EDGE.id, REKAAI_REKA_FLASH_3.id, RELACE_RELACE_APPLY_3.id, RELACE_RELACE_SEARCH.id, - SAO10K_L3_EURYALE_70B.id, SAO10K_L3_LUNARIS_8B.id, SAO10K_L3_1_70B_HANAMI_X1.id, SAO10K_L3_1_EURYALE_70B.id, @@ -15613,10 +15409,8 @@ export const OPENROUTER_CHAT_MODELS = [ XIAOMI_MIMO_V2_FLASH.id, XIAOMI_MIMO_V2_5.id, XIAOMI_MIMO_V2_5_PRO.id, - Z_AI_GLM_4_32B.id, Z_AI_GLM_4_5.id, Z_AI_GLM_4_5_AIR.id, - Z_AI_GLM_4_5_AIR_FREE.id, Z_AI_GLM_4_5V.id, Z_AI_GLM_4_6.id, Z_AI_GLM_4_6V.id, @@ -15625,7 +15419,6 @@ export const OPENROUTER_CHAT_MODELS = [ Z_AI_GLM_5.id, Z_AI_GLM_5_TURBO.id, Z_AI_GLM_5_1.id, - Z_AI_GLM_5V_TURBO.id, 'openrouter/auto', ] as const diff --git a/scripts/.sync-models-last-run b/scripts/.sync-models-last-run index be7a0996a..717f86528 100644 --- a/scripts/.sync-models-last-run +++ b/scripts/.sync-models-last-run @@ -1 +1 @@ -1780482493 +1781171945 diff --git a/scripts/openrouter.models.json b/scripts/openrouter.models.json index bcc2eeacd..a8a9b7624 100644 --- a/scripts/openrouter.models.json +++ b/scripts/openrouter.models.json @@ -1,4 +1,59 @@ [ + { + "id": "~anthropic/claude-fable-latest", + "canonical_slug": "~anthropic/claude-fable-latest", + "hugging_face_id": null, + "name": "Anthropic: Claude Fable Latest", + "created": 1781029944, + "description": "This model always redirects to the latest model in the Claude Fable family.", + "context_length": 1000000, + "architecture": { + "modality": "text+image+file->text", + "input_modalities": ["text", "image", "file"], + "output_modalities": ["text"], + "tokenizer": "Router", + "instruct_type": null + }, + "pricing": { + "prompt": "0.00001", + "completion": "0.00005", + "web_search": "0.01", + "input_cache_read": "0.000001", + "input_cache_write": "0.0000125" + }, + "top_provider": { + "context_length": 1000000, + "max_completion_tokens": 128000, + "is_moderated": true + }, + "per_request_limits": null, + "supported_parameters": [ + "include_reasoning", + "max_completion_tokens", + "max_tokens", + "reasoning", + "response_format", + "stop", + "structured_outputs", + "tool_choice", + "tools", + "verbosity" + ], + "default_parameters": { + "temperature": null, + "top_p": null, + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null + }, + "supported_voices": null, + "knowledge_cutoff": null, + "expiration_date": null, + "links": { + "details": "/api/v1/models/~anthropic/claude-fable-latest/endpoints" + } + }, { "id": "~anthropic/claude-haiku-latest", "canonical_slug": "~anthropic/claude-haiku-latest", @@ -301,13 +356,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000000684", - "completion": "0.00000342", - "input_cache_read": "0.000000144" + "prompt": "0.00000068", + "completion": "0.00000341", + "input_cache_read": "0.00000034" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 262144, + "context_length": 262142, + "max_completion_tokens": 262142, "is_moderated": false }, "per_request_limits": null, @@ -994,6 +1049,7 @@ "pricing": { "prompt": "0.00000025", "completion": "0.00000125", + "web_search": "0.01", "input_cache_read": "0.00000003", "input_cache_write": "0.0000003" }, @@ -1069,6 +1125,61 @@ "details": "/api/v1/models/anthropic/claude-3-5-haiku/endpoints" } }, + { + "id": "anthropic/claude-fable-5", + "canonical_slug": "anthropic/claude-5-fable-20260609", + "hugging_face_id": null, + "name": "Anthropic: Claude Fable 5", + "created": 1781007515, + "description": "Claude Fable 5 is a Mythos-class model from Anthropic, built for autonomous knowledge work and coding. It supports text, image, and file inputs with text output, with reasoning support and...", + "context_length": 1000000, + "architecture": { + "modality": "text+image+file->text", + "input_modalities": ["text", "image", "file"], + "output_modalities": ["text"], + "tokenizer": "Claude", + "instruct_type": null + }, + "pricing": { + "prompt": "0.00001", + "completion": "0.00005", + "web_search": "0.01", + "input_cache_read": "0.000001", + "input_cache_write": "0.0000125" + }, + "top_provider": { + "context_length": 1000000, + "max_completion_tokens": 128000, + "is_moderated": true + }, + "per_request_limits": null, + "supported_parameters": [ + "include_reasoning", + "max_completion_tokens", + "max_tokens", + "reasoning", + "response_format", + "stop", + "structured_outputs", + "tool_choice", + "tools", + "verbosity" + ], + "default_parameters": { + "temperature": null, + "top_p": null, + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null + }, + "supported_voices": null, + "knowledge_cutoff": null, + "expiration_date": null, + "links": { + "details": "/api/v1/models/anthropic/claude-5-fable-20260609/endpoints" + } + }, { "id": "anthropic/claude-haiku-4.5", "canonical_slug": "anthropic/claude-4.5-haiku-20251001", @@ -1833,96 +1944,6 @@ "details": "/api/v1/models/arcee-ai/coder-large/endpoints" } }, - { - "id": "arcee-ai/maestro-reasoning", - "canonical_slug": "arcee-ai/maestro-reasoning", - "hugging_face_id": "", - "name": "Arcee AI: Maestro Reasoning", - "created": 1746481269, - "description": "Maestro Reasoning is Arcee's flagship analysis model: a 32 B‑parameter derivative of Qwen 2.5‑32 B tuned with DPO and chain‑of‑thought RL for step‑by‑step logic. Compared to the earlier 7 B...", - "context_length": 131072, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0.0000009", - "completion": "0.0000033" - }, - "top_provider": { - "context_length": 131072, - "max_completion_tokens": 32000, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "logit_bias", - "max_tokens", - "min_p", - "presence_penalty", - "repetition_penalty", - "stop", - "temperature", - "top_k", - "top_p" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": "2025-03-31", - "expiration_date": null, - "links": { - "details": "/api/v1/models/arcee-ai/maestro-reasoning/endpoints" - } - }, - { - "id": "arcee-ai/spotlight", - "canonical_slug": "arcee-ai/spotlight", - "hugging_face_id": "", - "name": "Arcee AI: Spotlight", - "created": 1746481552, - "description": "Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks. It offers a 32 k‑token context window, enabling rich multimodal...", - "context_length": 131072, - "architecture": { - "modality": "text+image->text", - "input_modalities": ["image", "text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0.00000018", - "completion": "0.00000018" - }, - "top_provider": { - "context_length": 131072, - "max_completion_tokens": 65537, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "logit_bias", - "max_tokens", - "min_p", - "presence_penalty", - "repetition_penalty", - "stop", - "temperature", - "top_k", - "top_p" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": "2025-03-31", - "expiration_date": null, - "links": { - "details": "/api/v1/models/arcee-ai/spotlight/endpoints" - } - }, { "id": "arcee-ai/trinity-large-thinking", "canonical_slug": "arcee-ai/trinity-large-thinking", @@ -2079,54 +2100,6 @@ "details": "/api/v1/models/arcee-ai/virtuoso-large/endpoints" } }, - { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "canonical_slug": "baidu/ernie-4.5-vl-28b-a3b", - "hugging_face_id": "baidu/ERNIE-4.5-VL-28B-A3B-PT", - "name": "Baidu: ERNIE 4.5 VL 28B A3B", - "created": 1755032836, - "description": "A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering exceptional text and vision understanding through its innovative heterogeneous MoE structure with modality-isolated routing....", - "context_length": 131072, - "architecture": { - "modality": "text+image->text", - "input_modalities": ["text", "image"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0.00000014", - "completion": "0.00000056" - }, - "top_provider": { - "context_length": 30000, - "max_completion_tokens": 8000, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "include_reasoning", - "max_tokens", - "presence_penalty", - "reasoning", - "repetition_penalty", - "seed", - "stop", - "temperature", - "tool_choice", - "tools", - "top_k", - "top_p" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": "2025-03-31", - "expiration_date": null, - "links": { - "details": "/api/v1/models/baidu/ernie-4.5-vl-28b-a3b/endpoints" - } - }, { "id": "baidu/ernie-4.5-vl-424b-a47b", "canonical_slug": "baidu/ernie-4.5-vl-424b-a47b", @@ -2760,7 +2733,7 @@ "name": "DeepSeek: DeepSeek V3 0324", "created": 1742824755, "description": "DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team. It succeeds the [DeepSeek V3](/deepseek/deepseek-chat-v3) model and performs really well...", - "context_length": 163840, + "context_length": 131072, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -2774,7 +2747,7 @@ "input_cache_read": "0.000000135" }, "top_provider": { - "context_length": 163840, + "context_length": 32768, "max_completion_tokens": 16384, "is_moderated": false }, @@ -3016,7 +2989,7 @@ "default_parameters": {}, "supported_voices": null, "knowledge_cutoff": "2024-07-31", - "expiration_date": null, + "expiration_date": "2026-06-11", "links": { "details": "/api/v1/models/deepseek/deepseek-r1-distill-llama-70b/endpoints" } @@ -4324,8 +4297,8 @@ "instruct_type": "gemma" }, "pricing": { - "prompt": "0.00000004", - "completion": "0.00000013" + "prompt": "0.00000005", + "completion": "0.00000015" }, "top_provider": { "context_length": 131072, @@ -4428,8 +4401,8 @@ "instruct_type": "gemma" }, "pricing": { - "prompt": "0.00000004", - "completion": "0.00000008" + "prompt": "0.00000005", + "completion": "0.0000001" }, "top_provider": { "context_length": 131072, @@ -4628,11 +4601,12 @@ }, "pricing": { "prompt": "0.00000012", - "completion": "0.00000037" + "completion": "0.00000036", + "input_cache_read": "0.00000009" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 16384, + "context_length": 256000, + "max_completion_tokens": 8192, "is_moderated": false }, "per_request_limits": null, @@ -5564,7 +5538,7 @@ "default_parameters": {}, "supported_voices": null, "knowledge_cutoff": "2023-12-31", - "expiration_date": null, + "expiration_date": "2026-06-19", "links": { "details": "/api/v1/models/meta-llama/llama-3-70b-instruct/endpoints" } @@ -5585,12 +5559,12 @@ "instruct_type": "llama3" }, "pricing": { - "prompt": "0.00000004", - "completion": "0.00000004" + "prompt": "0.00000014", + "completion": "0.00000014" }, "top_provider": { "context_length": 8192, - "max_completion_tokens": 8192, + "max_completion_tokens": null, "is_moderated": false }, "per_request_limits": null, @@ -5601,8 +5575,6 @@ "min_p", "presence_penalty", "repetition_penalty", - "response_format", - "seed", "stop", "temperature", "top_k", @@ -5683,10 +5655,10 @@ }, "pricing": { "prompt": "0.00000002", - "completion": "0.00000005" + "completion": "0.00000003" }, "top_provider": { - "context_length": 16384, + "context_length": 131072, "max_completion_tokens": 16384, "is_moderated": false }, @@ -5732,8 +5704,8 @@ "instruct_type": "llama3" }, "pricing": { - "prompt": "0.000000245", - "completion": "0.000000245" + "prompt": "0.000000345", + "completion": "0.000000345" }, "top_provider": { "context_length": 131072, @@ -6057,7 +6029,7 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000008", + "prompt": "0.0000001", "completion": "0.0000003" }, "top_provider": { @@ -6586,7 +6558,8 @@ }, "pricing": { "prompt": "0.00000015", - "completion": "0.00000115" + "completion": "0.0000009", + "input_cache_read": "0.00000005" }, "top_provider": { "context_length": 196608, @@ -6648,11 +6621,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000000279", - "completion": "0.0000012" + "prompt": "0.00000027", + "completion": "0.00000108", + "input_cache_read": "0.000000054" }, "top_provider": { - "context_length": 196608, + "context_length": 204800, "max_completion_tokens": 131072, "is_moderated": false }, @@ -7887,13 +7861,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000004", - "completion": "0.0000019", - "input_cache_read": "0.00000009" + "prompt": "0.00000035", + "completion": "0.00000189" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 262144, + "context_length": 256000, + "max_completion_tokens": null, "is_moderated": false }, "per_request_limits": null, @@ -7949,13 +7922,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000000684", - "completion": "0.00000342", - "input_cache_read": "0.000000144" + "prompt": "0.00000068", + "completion": "0.00000341", + "input_cache_read": "0.00000034" }, "top_provider": { - "context_length": 262144, - "max_completion_tokens": 262144, + "context_length": 262142, + "max_completion_tokens": 262142, "is_moderated": false }, "per_request_limits": null, @@ -7997,52 +7970,6 @@ "details": "/api/v1/models/moonshotai/kimi-k2.6-20260420/endpoints" } }, - { - "id": "moonshotai/kimi-k2.6:free", - "canonical_slug": "moonshotai/kimi-k2.6-20260420", - "hugging_face_id": "moonshotai/Kimi-K2.6", - "name": "MoonshotAI: Kimi K2.6 (free)", - "created": 1776699402, - "description": "Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration. It handles complex end-to-end coding tasks across Python, Rust, and Go, and...", - "context_length": 262144, - "architecture": { - "modality": "text+image->text", - "input_modalities": ["text", "image"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0", - "completion": "0" - }, - "top_provider": { - "context_length": 262144, - "max_completion_tokens": null, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "include_reasoning", - "reasoning", - "tool_choice", - "tools" - ], - "default_parameters": { - "temperature": null, - "top_p": null, - "top_k": null, - "frequency_penalty": null, - "presence_penalty": null, - "repetition_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": null, - "expiration_date": null, - "links": { - "details": "/api/v1/models/moonshotai/kimi-k2.6-20260420/endpoints" - } - }, { "id": "morph/morph-v3-fast", "canonical_slug": "morph/morph-v3-fast", @@ -8120,33 +8047,36 @@ } }, { - "id": "nex-agi/deepseek-v3.1-nex-n1", - "canonical_slug": "nex-agi/deepseek-v3.1-nex-n1", - "hugging_face_id": "nex-agi/DeepSeek-V3.1-Nex-N1", - "name": "Nex AGI: DeepSeek V3.1 Nex N1", - "created": 1765204393, - "description": "DeepSeek V3.1 Nex-N1 is the flagship release of the Nex-N1 series — a post-trained model designed to highlight agent autonomy, tool use, and real-world productivity. Nex-N1 demonstrates competitive performance across...", - "context_length": 131072, + "id": "nex-agi/nex-n2-pro:free", + "canonical_slug": "nex-agi/nex-n2-pro", + "hugging_face_id": "nex-agi/Nex-N2-Pro", + "name": "Nex AGI: Nex-N2-Pro (free)", + "created": 1780937140, + "description": "Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total. Built on the Qwen3.5 architecture, it accepts text and image input and produces...", + "context_length": 262144, "architecture": { - "modality": "text->text", - "input_modalities": ["text"], + "modality": "text+image->text", + "input_modalities": ["text", "image"], "output_modalities": ["text"], - "tokenizer": "DeepSeek", + "tokenizer": "Qwen3", "instruct_type": null }, "pricing": { - "prompt": "0.000000135", - "completion": "0.0000005" + "prompt": "0", + "completion": "0" }, "top_provider": { - "context_length": 131072, - "max_completion_tokens": 163840, + "context_length": 262144, + "max_completion_tokens": 262144, "is_moderated": false }, "per_request_limits": null, "supported_parameters": [ "frequency_penalty", + "include_reasoning", + "logprobs", "max_tokens", + "reasoning", "response_format", "structured_outputs", "temperature", @@ -8156,61 +8086,18 @@ "top_p" ], "default_parameters": { - "temperature": null, - "top_p": null, - "frequency_penalty": null + "temperature": 0.7, + "top_p": 0.95, + "top_k": 40, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null }, "supported_voices": null, "knowledge_cutoff": null, - "expiration_date": "2026-06-08", - "links": { - "details": "/api/v1/models/nex-agi/deepseek-v3.1-nex-n1/endpoints" - } - }, - { - "id": "nousresearch/hermes-2-pro-llama-3-8b", - "canonical_slug": "nousresearch/hermes-2-pro-llama-3-8b", - "hugging_face_id": "NousResearch/Hermes-2-Pro-Llama-3-8B", - "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", - "created": 1716768000, - "description": "Hermes 2 Pro is an upgraded, retrained version of Nous Hermes 2, consisting of an updated and cleaned version of the OpenHermes 2.5 Dataset, as well as a newly introduced...", - "context_length": 8192, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Llama3", - "instruct_type": "chatml" - }, - "pricing": { - "prompt": "0.00000014", - "completion": "0.00000014" - }, - "top_provider": { - "context_length": 8192, - "max_completion_tokens": 8192, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "max_tokens", - "presence_penalty", - "repetition_penalty", - "response_format", - "seed", - "stop", - "structured_outputs", - "temperature", - "top_k", - "top_p" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": "2023-12-31", - "expiration_date": "2026-06-05", + "expiration_date": null, "links": { - "details": "/api/v1/models/nousresearch/hermes-2-pro-llama-3-8b/endpoints" + "details": "/api/v1/models/nex-agi/nex-n2-pro/endpoints" } }, { @@ -8319,8 +8206,8 @@ "instruct_type": "chatml" }, "pricing": { - "prompt": "0.0000003", - "completion": "0.0000003" + "prompt": "0.0000007", + "completion": "0.0000007" }, "top_provider": { "context_length": 131072, @@ -8457,7 +8344,7 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000001", + "prompt": "0.0000004", "completion": "0.0000004" }, "top_provider": { @@ -8689,6 +8576,7 @@ "response_format", "seed", "stop", + "structured_outputs", "temperature", "tool_choice", "tools", @@ -8763,6 +8651,164 @@ "details": "/api/v1/models/nvidia/nemotron-3-super-120b-a12b-20230311/endpoints" } }, + { + "id": "nvidia/nemotron-3-ultra-550b-a55b", + "canonical_slug": "nvidia/nemotron-3-ultra-550b-a55b-20260604", + "hugging_face_id": "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16", + "name": "NVIDIA: Nemotron 3 Ultra", + "created": 1780551208, + "description": "NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE). Built on a hybrid Transformer-Mamba mixture-of-experts architecture, it...", + "context_length": 1000000, + "architecture": { + "modality": "text->text", + "input_modalities": ["text"], + "output_modalities": ["text"], + "tokenizer": "Other", + "instruct_type": null + }, + "pricing": { + "prompt": "0.0000005", + "completion": "0.0000025", + "input_cache_read": "0.00000015" + }, + "top_provider": { + "context_length": 262144, + "max_completion_tokens": 16384, + "is_moderated": false + }, + "per_request_limits": null, + "supported_parameters": [ + "frequency_penalty", + "include_reasoning", + "logit_bias", + "max_tokens", + "min_p", + "presence_penalty", + "reasoning", + "repetition_penalty", + "response_format", + "seed", + "stop", + "structured_outputs", + "temperature", + "tool_choice", + "tools", + "top_k", + "top_p" + ], + "default_parameters": { + "temperature": 1, + "top_p": 0.95, + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null + }, + "supported_voices": null, + "knowledge_cutoff": null, + "expiration_date": null, + "links": { + "details": "/api/v1/models/nvidia/nemotron-3-ultra-550b-a55b-20260604/endpoints" + } + }, + { + "id": "nvidia/nemotron-3-ultra-550b-a55b:free", + "canonical_slug": "nvidia/nemotron-3-ultra-550b-a55b-20260604", + "hugging_face_id": "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16", + "name": "NVIDIA: Nemotron 3 Ultra (free)", + "created": 1780551208, + "description": "NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE). Built on a hybrid Transformer-Mamba mixture-of-experts architecture, it...", + "context_length": 1000000, + "architecture": { + "modality": "text->text", + "input_modalities": ["text"], + "output_modalities": ["text"], + "tokenizer": "Other", + "instruct_type": null + }, + "pricing": { + "prompt": "0", + "completion": "0" + }, + "top_provider": { + "context_length": 1000000, + "max_completion_tokens": 65536, + "is_moderated": false + }, + "per_request_limits": null, + "supported_parameters": [ + "include_reasoning", + "max_tokens", + "reasoning", + "seed", + "temperature", + "tool_choice", + "tools", + "top_p" + ], + "default_parameters": { + "temperature": 1, + "top_p": 0.95, + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null + }, + "supported_voices": null, + "knowledge_cutoff": null, + "expiration_date": null, + "links": { + "details": "/api/v1/models/nvidia/nemotron-3-ultra-550b-a55b-20260604/endpoints" + } + }, + { + "id": "nvidia/nemotron-3.5-content-safety:free", + "canonical_slug": "nvidia/nemotron-3.5-content-safety-20260604", + "hugging_face_id": "nvidia/Nemotron-3.5-Content-Safety", + "name": "NVIDIA: Nemotron 3.5 Content Safety (free)", + "created": 1780581864, + "description": "NVIDIA Nemotron 3.5 Content Safety is a compact 4B-parameter multimodal guardrail model from NVIDIA, fine-tuned from Google Gemma-3-4B. It moderates both inputs to and responses from LLMs and VLMs, accepting...", + "context_length": 128000, + "architecture": { + "modality": "text+image->text", + "input_modalities": ["text", "image"], + "output_modalities": ["text"], + "tokenizer": "Other", + "instruct_type": null + }, + "pricing": { + "prompt": "0", + "completion": "0" + }, + "top_provider": { + "context_length": 128000, + "max_completion_tokens": 8192, + "is_moderated": false + }, + "per_request_limits": null, + "supported_parameters": [ + "include_reasoning", + "max_tokens", + "reasoning", + "seed", + "temperature", + "top_p" + ], + "default_parameters": { + "temperature": null, + "top_p": null, + "top_k": null, + "frequency_penalty": null, + "presence_penalty": null, + "repetition_penalty": null + }, + "supported_voices": null, + "knowledge_cutoff": null, + "expiration_date": null, + "links": { + "details": "/api/v1/models/nvidia/nemotron-3.5-content-safety-20260604/endpoints" + } + }, { "id": "nvidia/nemotron-nano-12b-v2-vl:free", "canonical_slug": "nvidia/nemotron-nano-12b-v2-vl", @@ -8860,7 +8906,7 @@ }, "supported_voices": null, "knowledge_cutoff": "2025-03-31", - "expiration_date": null, + "expiration_date": "2026-06-11", "links": { "details": "/api/v1/models/nvidia/nemotron-nano-9b-v2/endpoints" } @@ -9106,116 +9152,17 @@ "knowledge_cutoff": "2021-09-30", "expiration_date": null, "links": { - "details": "/api/v1/models/openai/gpt-3.5-turbo-instruct/endpoints" - } - }, - { - "id": "openai/gpt-4", - "canonical_slug": "openai/gpt-4", - "hugging_face_id": null, - "name": "OpenAI: GPT-4", - "created": 1685232000, - "description": "OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and advanced reasoning...", - "context_length": 8191, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "GPT", - "instruct_type": null - }, - "pricing": { - "prompt": "0.00003", - "completion": "0.00006" - }, - "top_provider": { - "context_length": 8191, - "max_completion_tokens": 4096, - "is_moderated": true - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "logit_bias", - "logprobs", - "max_completion_tokens", - "max_tokens", - "presence_penalty", - "response_format", - "seed", - "stop", - "structured_outputs", - "temperature", - "tool_choice", - "tools", - "top_logprobs", - "top_p" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": "2021-09-30", - "expiration_date": null, - "links": { - "details": "/api/v1/models/openai/gpt-4/endpoints" - } - }, - { - "id": "openai/gpt-4-0314", - "canonical_slug": "openai/gpt-4-0314", - "hugging_face_id": null, - "name": "OpenAI: GPT-4 (older v0314)", - "created": 1685232000, - "description": "GPT-4-0314 is the first version of GPT-4 released, with a context length of 8,192 tokens, and was supported until June 14. Training data: up to Sep 2021.", - "context_length": 8191, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "GPT", - "instruct_type": null - }, - "pricing": { - "prompt": "0.00003", - "completion": "0.00006" - }, - "top_provider": { - "context_length": 8191, - "max_completion_tokens": 4096, - "is_moderated": true - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "logit_bias", - "logprobs", - "max_tokens", - "presence_penalty", - "response_format", - "seed", - "stop", - "structured_outputs", - "temperature", - "tool_choice", - "tools", - "top_logprobs", - "top_p" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": "2021-09-30", - "expiration_date": null, - "links": { - "details": "/api/v1/models/openai/gpt-4-0314/endpoints" + "details": "/api/v1/models/openai/gpt-3.5-turbo-instruct/endpoints" } }, { - "id": "openai/gpt-4-1106-preview", - "canonical_slug": "openai/gpt-4-1106-preview", + "id": "openai/gpt-4", + "canonical_slug": "openai/gpt-4", "hugging_face_id": null, - "name": "OpenAI: GPT-4 Turbo (older v1106)", - "created": 1699228800, - "description": "The latest GPT-4 Turbo model with vision capabilities. Vision requests can now use JSON mode and function calling.\n\nTraining data: up to April 2023.", - "context_length": 128000, + "name": "OpenAI: GPT-4", + "created": 1685232000, + "description": "OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and advanced reasoning...", + "context_length": 8191, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -9224,12 +9171,11 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00001", - "completion": "0.00003", - "web_search": "0.01" + "prompt": "0.00003", + "completion": "0.00006" }, "top_provider": { - "context_length": 128000, + "context_length": 8191, "max_completion_tokens": 4096, "is_moderated": true }, @@ -9238,6 +9184,7 @@ "frequency_penalty", "logit_bias", "logprobs", + "max_completion_tokens", "max_tokens", "presence_penalty", "response_format", @@ -9252,10 +9199,10 @@ ], "default_parameters": {}, "supported_voices": null, - "knowledge_cutoff": "2023-04-30", + "knowledge_cutoff": "2021-09-30", "expiration_date": null, "links": { - "details": "/api/v1/models/openai/gpt-4-1106-preview/endpoints" + "details": "/api/v1/models/openai/gpt-4/endpoints" } }, { @@ -13072,7 +13019,7 @@ "instruct_type": null }, "pricing": { - "prompt": "0.000000071", + "prompt": "0.00000009", "completion": "0.0000001" }, "top_provider": { @@ -13179,12 +13126,12 @@ "instruct_type": "qwen3" }, "pricing": { - "prompt": "0.00000009", - "completion": "0.00000045" + "prompt": "0.00000012", + "completion": "0.0000005" }, "top_provider": { "context_length": 40960, - "max_completion_tokens": 20000, + "max_completion_tokens": 16384, "is_moderated": false }, "per_request_limits": null, @@ -13216,7 +13163,7 @@ }, "supported_voices": null, "knowledge_cutoff": "2025-03-31", - "expiration_date": "2026-06-05", + "expiration_date": null, "links": { "details": "/api/v1/models/qwen/qwen3-30b-a3b-04-28/endpoints" } @@ -13237,8 +13184,8 @@ "instruct_type": null }, "pricing": { - "prompt": "0.0000000428", - "completion": "0.0000001716" + "prompt": "0.00000004815", + "completion": "0.00000019305" }, "top_provider": { "context_length": 128000, @@ -14622,12 +14569,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000004", + "prompt": "0.0000001", "completion": "0.00000015" }, "top_provider": { "context_length": 262144, - "max_completion_tokens": 81920, + "max_completion_tokens": 262144, "is_moderated": false }, "per_request_limits": null, @@ -14830,12 +14777,12 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000029", - "completion": "0.0000032" + "prompt": "0.000000289", + "completion": "0.0000024" }, "top_provider": { - "context_length": 262140, - "max_completion_tokens": 262140, + "context_length": 131072, + "max_completion_tokens": 131072, "is_moderated": false }, "per_request_limits": null, @@ -14891,12 +14838,13 @@ "instruct_type": null }, "pricing": { - "prompt": "0.00000014", - "completion": "0.000001" + "prompt": "0.00000015", + "completion": "0.000001", + "input_cache_read": "0.00000005" }, "top_provider": { - "context_length": 262140, - "max_completion_tokens": 262140, + "context_length": 262144, + "max_completion_tokens": 262144, "is_moderated": false }, "per_request_limits": null, @@ -15140,6 +15088,56 @@ "details": "/api/v1/models/qwen/qwen3.7-max-20260520/endpoints" } }, + { + "id": "qwen/qwen3.7-plus", + "canonical_slug": "qwen/qwen3.7-plus-20260602", + "hugging_face_id": null, + "name": "Qwen: Qwen3.7 Plus", + "created": 1780491783, + "description": "Qwen3.7-Plus is a cost-effective model in Alibaba's Qwen3.7 series. It supports text and image input with text output, building on the series' text capabilities with a comprehensive upgrade to its...", + "context_length": 1000000, + "architecture": { + "modality": "text+image->text", + "input_modalities": ["text", "image"], + "output_modalities": ["text"], + "tokenizer": "Qwen", + "instruct_type": null + }, + "pricing": { + "prompt": "0.0000004", + "completion": "0.0000016", + "input_cache_read": "0.00000008", + "input_cache_write": "0.0000005" + }, + "top_provider": { + "context_length": 1000000, + "max_completion_tokens": 65536, + "is_moderated": false + }, + "per_request_limits": null, + "supported_parameters": [ + "include_reasoning", + "logprobs", + "max_tokens", + "presence_penalty", + "reasoning", + "response_format", + "seed", + "structured_outputs", + "temperature", + "tool_choice", + "tools", + "top_logprobs", + "top_p" + ], + "default_parameters": {}, + "supported_voices": null, + "knowledge_cutoff": null, + "expiration_date": null, + "links": { + "details": "/api/v1/models/qwen/qwen3.7-plus-20260602/endpoints" + } + }, { "id": "rekaai/reka-edge", "canonical_slug": "rekaai/reka-edge-2603", @@ -15329,52 +15327,6 @@ "details": "/api/v1/models/relace/relace-search-20251208/endpoints" } }, - { - "id": "sao10k/l3-euryale-70b", - "canonical_slug": "sao10k/l3-euryale-70b", - "hugging_face_id": "Sao10K/L3-70B-Euryale-v2.1", - "name": "Sao10k: Llama 3 Euryale 70B v2.1", - "created": 1718668800, - "description": "Euryale 70B v2.1 is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k). - Better prompt adherence. - Better anatomy / spatial awareness. - Adapts much better to unique and custom...", - "context_length": 8192, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Llama3", - "instruct_type": "llama3" - }, - "pricing": { - "prompt": "0.00000148", - "completion": "0.00000148" - }, - "top_provider": { - "context_length": 8192, - "max_completion_tokens": 8192, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "frequency_penalty", - "max_tokens", - "presence_penalty", - "repetition_penalty", - "seed", - "stop", - "temperature", - "tool_choice", - "tools", - "top_k", - "top_p" - ], - "default_parameters": {}, - "supported_voices": null, - "knowledge_cutoff": "2023-12-31", - "expiration_date": "2026-06-05", - "links": { - "details": "/api/v1/models/sao10k/l3-euryale-70b/endpoints" - } - }, { "id": "sao10k/l3-lunaris-8b", "canonical_slug": "sao10k/l3-lunaris-8b", @@ -16425,14 +16377,11 @@ "max_tokens", "presence_penalty", "reasoning", - "repetition_penalty", "response_format", - "seed", "stop", "temperature", "tool_choice", "tools", - "top_k", "top_p" ], "default_parameters": { @@ -16561,50 +16510,6 @@ "details": "/api/v1/models/xiaomi/mimo-v2.5-pro-20260422/endpoints" } }, - { - "id": "z-ai/glm-4-32b", - "canonical_slug": "z-ai/glm-4-32b-0414", - "hugging_face_id": "", - "name": "Z.ai: GLM 4 32B ", - "created": 1753376617, - "description": "GLM 4 32B is a cost-effective foundation language model. It can efficiently perform complex tasks and has significantly enhanced capabilities in tool use, online search, and code-related intelligent tasks. It...", - "context_length": 128000, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0.0000001", - "completion": "0.0000001" - }, - "top_provider": { - "context_length": 128000, - "max_completion_tokens": null, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "max_tokens", - "temperature", - "tool_choice", - "tools", - "top_p" - ], - "default_parameters": { - "temperature": 0.75, - "top_p": null, - "frequency_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": "2024-06-30", - "expiration_date": null, - "links": { - "details": "/api/v1/models/z-ai/glm-4-32b-0414/endpoints" - } - }, { "id": "z-ai/glm-4.5", "canonical_slug": "z-ai/glm-4.5", @@ -16654,7 +16559,7 @@ }, "supported_voices": null, "knowledge_cutoff": "2024-12-31", - "expiration_date": null, + "expiration_date": "2026-06-19", "links": { "details": "/api/v1/models/z-ai/glm-4.5/endpoints" } @@ -16688,6 +16593,7 @@ "supported_parameters": [ "frequency_penalty", "include_reasoning", + "logprobs", "max_tokens", "presence_penalty", "reasoning", @@ -16699,52 +16605,7 @@ "tool_choice", "tools", "top_k", - "top_p" - ], - "default_parameters": { - "temperature": 0.75, - "top_p": null, - "frequency_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": "2024-12-31", - "expiration_date": null, - "links": { - "details": "/api/v1/models/z-ai/glm-4.5-air/endpoints" - } - }, - { - "id": "z-ai/glm-4.5-air:free", - "canonical_slug": "z-ai/glm-4.5-air", - "hugging_face_id": "zai-org/GLM-4.5-Air", - "name": "Z.ai: GLM 4.5 Air (free)", - "created": 1753471258, - "description": "GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications. Like GLM-4.5, it adopts the Mixture-of-Experts (MoE) architecture but with a more compact parameter...", - "context_length": 131072, - "architecture": { - "modality": "text->text", - "input_modalities": ["text"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0", - "completion": "0" - }, - "top_provider": { - "context_length": 131072, - "max_completion_tokens": 96000, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "include_reasoning", - "max_tokens", - "reasoning", - "temperature", - "tool_choice", - "tools", + "top_logprobs", "top_p" ], "default_parameters": { @@ -16891,11 +16752,11 @@ "pricing": { "prompt": "0.0000003", "completion": "0.0000009", - "input_cache_read": "0.00000005" + "input_cache_read": "0.000000055" }, "top_provider": { "context_length": 131072, - "max_completion_tokens": 24000, + "max_completion_tokens": 32768, "is_moderated": false }, "per_request_limits": null, @@ -17107,7 +16968,7 @@ "name": "Z.ai: GLM 5 Turbo", "created": 1773583573, "description": "GLM-5 Turbo is a new model from Z.ai designed for fast inference and strong performance in agent-driven environments such as OpenClaw scenarios. It is deeply optimized for real-world agent workflows...", - "context_length": 202752, + "context_length": 262144, "architecture": { "modality": "text->text", "input_modalities": ["text"], @@ -17121,7 +16982,7 @@ "input_cache_read": "0.00000024" }, "top_provider": { - "context_length": 202752, + "context_length": 262144, "max_completion_tokens": 131072, "is_moderated": false }, @@ -17222,56 +17083,5 @@ "links": { "details": "/api/v1/models/z-ai/glm-5.1-20260406/endpoints" } - }, - { - "id": "z-ai/glm-5v-turbo", - "canonical_slug": "z-ai/glm-5v-turbo-20260401", - "hugging_face_id": "", - "name": "Z.ai: GLM 5V Turbo", - "created": 1775061458, - "description": "GLM-5V-Turbo is Z.ai’s first native multimodal agent foundation model, built for vision-based coding and agent-driven tasks. It natively handles image, video, and text inputs, excels at long-horizon planning, complex coding,...", - "context_length": 202752, - "architecture": { - "modality": "text+image+video->text", - "input_modalities": ["image", "text", "video"], - "output_modalities": ["text"], - "tokenizer": "Other", - "instruct_type": null - }, - "pricing": { - "prompt": "0.0000012", - "completion": "0.000004", - "input_cache_read": "0.00000024" - }, - "top_provider": { - "context_length": 202752, - "max_completion_tokens": 131072, - "is_moderated": false - }, - "per_request_limits": null, - "supported_parameters": [ - "include_reasoning", - "max_tokens", - "reasoning", - "response_format", - "temperature", - "tool_choice", - "tools", - "top_p" - ], - "default_parameters": { - "temperature": 1, - "top_p": 0.95, - "top_k": null, - "frequency_penalty": null, - "presence_penalty": null, - "repetition_penalty": null - }, - "supported_voices": null, - "knowledge_cutoff": null, - "expiration_date": null, - "links": { - "details": "/api/v1/models/z-ai/glm-5v-turbo-20260401/endpoints" - } } ]