diff --git a/.changeset/sync-models.md b/.changeset/sync-models.md
new file mode 100644
index 000000000..3949386d6
--- /dev/null
+++ b/.changeset/sync-models.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-anthropic': patch
+---
+
+Update model metadata from OpenRouter API
diff --git a/packages/ai-anthropic/src/model-meta.ts b/packages/ai-anthropic/src/model-meta.ts
index 86301ed7d..94df2ba39 100644
--- a/packages/ai-anthropic/src/model-meta.ts
+++ b/packages/ai-anthropic/src/model-meta.ts
@@ -710,6 +710,45 @@ const CLAUDE_OPUS_4_8_FAST = {
     AnthropicSamplingOptions
 >
 
+const CLAUDE_FABLE_5 = {
+  name: 'claude-fable-5', // Metadata record for the claude-fable-5 model; its shape is checked against ModelMeta below.
+  id: 'claude-fable-5', // Listed in ANTHROPIC_MODELS and used as the key in the per-model type maps.
+  context_window: 1_000_000, // presumably a token count — confirm against ModelMeta.
+  max_output_tokens: 128_000,
+  supports: {
+    input: ['text', 'image', 'document'], // Exposed per model through AnthropicModelInputModalitiesByName.
+    extended_thinking: true,
+    priority_tier: true,
+    tools: [
+      'web_search',
+      'web_fetch',
+      'code_execution',
+      'computer_use',
+      'bash',
+      'text_editor',
+      'memory',
+    ],
+  },
+  pricing: {
+    input: {
+      normal: 10, // NOTE(review): pricing units are not visible in this diff (presumably USD per 1M tokens) — confirm.
+      cached: 1, // presumably the cache-read rate — confirm.
+    },
+    output: {
+      normal: 50,
+    },
+  },
+} as const satisfies ModelMeta<
+  AnthropicContainerOptions &
+    AnthropicContextManagementOptions &
+    AnthropicMCPOptions &
+    AnthropicServiceTierOptions &
+    AnthropicStopSequencesOptions &
+    AnthropicThinkingOptions &
+    AnthropicToolChoiceOptions &
+    AnthropicSamplingOptions
+>
+
 export const ANTHROPIC_MODELS = [
   CLAUDE_OPUS_4_6.id,
   CLAUDE_OPUS_4_5.id,
@@ -731,6 +770,8 @@ export const ANTHROPIC_MODELS = [
 
   CLAUDE_OPUS_4_8.id,
   CLAUDE_OPUS_4_8_FAST.id,
+
+  CLAUDE_FABLE_5.id,
 ] as const
 
 /**
@@ -891,6 +932,14 @@ export type AnthropicChatModelProviderOptionsByName = {
     AnthropicThinkingOptions &
     AnthropicToolChoiceOptions &
     AnthropicSamplingOptions
+  [CLAUDE_FABLE_5.id]: AnthropicContainerOptions &
+    AnthropicContextManagementOptions &
+    AnthropicMCPOptions &
+    AnthropicServiceTierOptions &
+    AnthropicStopSequencesOptions &
+    AnthropicThinkingOptions &
+    AnthropicToolChoiceOptions &
+    AnthropicSamplingOptions
 }
 
 export type AnthropicChatModelToolCapabilitiesByName = {
@@ -937,4 +986,5 @@ export type AnthropicModelInputModalitiesByName = {
   [CLAUDE_OPUS_4_7_FAST.id]: typeof CLAUDE_OPUS_4_7_FAST.supports.input
   [CLAUDE_OPUS_4_8.id]: typeof CLAUDE_OPUS_4_8.supports.input
   [CLAUDE_OPUS_4_8_FAST.id]: typeof CLAUDE_OPUS_4_8_FAST.supports.input
+  [CLAUDE_FABLE_5.id]: typeof CLAUDE_FABLE_5.supports.input
 }
diff --git a/packages/ai-openrouter/src/model-meta.ts b/packages/ai-openrouter/src/model-meta.ts
index 42122cd2c..d7b08cc41 100644
--- a/packages/ai-openrouter/src/model-meta.ts
+++ b/packages/ai-openrouter/src/model-meta.ts
@@ -3,6 +3,36 @@ import type {
   OpenRouterCommonOptions,
 } from './text/text-provider-options'
 
+const _ANTHROPIC_CLAUDE_FABLE_LATEST = {
+  id: '~anthropic/claude-fable-latest', // Keys this model's entry in OpenRouterModelOptionsByName, whose Pick<> repeats the option names listed under supports.supports.
+  name: 'Anthropic: Claude Fable Latest',
+  supports: {
+    input: ['text', 'image', 'document'],
+    output: ['text'],
+    supports: [
+      'maxCompletionTokens',
+      'maxCompletionTokens', // NOTE(review): duplicate of the line above; redundant in a literal list — likely a generator artifact, confirm.
+      'reasoning',
+      'responseFormat',
+      'stop',
+      'toolChoice',
+    ],
+  },
+  context_window: 1000000, // presumably a token count — confirm.
+  max_output_tokens: 128000,
+  pricing: {
+    text: {
+      input: {
+        normal: 10, // NOTE(review): pricing units are not visible in this diff — confirm.
+        cached: 13.5, // NOTE(review): higher than the normal input rate (10) — confirm what this figure represents.
+      },
+      output: {
+        normal: 50,
+      },
+    },
+    image: 0,
+  },
+} as const // 'as const' keeps .id a string-literal type so it can be used as a computed key in the type maps.
 const _ANTHROPIC_CLAUDE_HAIKU_LATEST = {
   id: '~anthropic/claude-haiku-latest',
   name: 'Anthropic Claude Haiku Latest',
@@ -183,15 +213,15 @@ const _MOONSHOTAI_KIMI_LATEST = {
     ],
   },
   context_window: 262144,
-  max_output_tokens: 262144,
+  max_output_tokens: 262142,
   pricing: {
     text: {
       input: {
-        normal: 0.684,
-        cached: 0.144,
+        normal: 0.68,
+        cached: 0.34,
       },
       output: {
-        normal: 3.42,
+        normal: 3.41,
       },
     },
     image: 0,
@@ -628,6 +658,36 @@ const ANTHROPIC_CLAUDE_3_5_HAIKU = {
     image: 0,
   },
 } as const
+const ANTHROPIC_CLAUDE_FABLE_5 = {
+  id: 'anthropic/claude-fable-5', // Keys this model's entry in OpenRouterModelOptionsByName, whose Pick<> repeats the option names listed under supports.supports.
+  name: 'Anthropic: Claude Fable 5',
+  supports: {
+    input: ['text', 'image', 'document'],
+    output: ['text'],
+    supports: [
+      'maxCompletionTokens',
+      'maxCompletionTokens', // NOTE(review): duplicate of the line above; redundant in a literal list — likely a generator artifact, confirm.
+      'reasoning',
+      'responseFormat',
+      'stop',
+      'toolChoice',
+    ],
+  },
+  context_window: 1000000, // presumably a token count — confirm.
+  max_output_tokens: 128000,
+  pricing: {
+    text: {
+      input: {
+        normal: 10, // NOTE(review): pricing units are not visible in this diff — confirm.
+        cached: 13.5, // NOTE(review): exceeds the normal input rate (10), and the ai-anthropic metadata for claude-fable-5 lists cached: 1 — confirm which is intended.
+      },
+      output: {
+        normal: 50,
+      },
+    },
+    image: 0,
+  },
+} as const // 'as const' keeps .id a string-literal type so it can be used as a computed key in the type maps.
 const ANTHROPIC_CLAUDE_HAIKU_4_5 = {
   id: 'anthropic/claude-haiku-4.5',
   name: 'Anthropic: Claude Haiku 4.5',
@@ -1052,68 +1112,6 @@ const ARCEE_AI_CODER_LARGE = {
     image: 0,
   },
 } as const
-const ARCEE_AI_MAESTRO_REASONING = {
-  id: 'arcee-ai/maestro-reasoning',
-  name: 'Arcee AI: Maestro Reasoning',
-  supports: {
-    input: ['text'],
-    output: ['text'],
-    supports: [
-      'frequencyPenalty',
-      'logitBias',
-      'maxCompletionTokens',
-      'presencePenalty',
-      'stop',
-      'temperature',
-      'topP',
-    ],
-  },
-  context_window: 131072,
-  max_output_tokens: 32000,
-  pricing: {
-    text: {
-      input: {
-        normal: 0.9,
-        cached: 0,
-      },
-      output: {
-        normal: 3.3,
-      },
-    },
-    image: 0,
-  },
-} as const
-const ARCEE_AI_SPOTLIGHT = {
-  id: 'arcee-ai/spotlight',
-  name: 'Arcee AI: Spotlight',
-  supports: {
-    input: ['image', 'text'],
-    output: ['text'],
-    supports: [
-      'frequencyPenalty',
-      'logitBias',
-      'maxCompletionTokens',
-      'presencePenalty',
-      'stop',
-      'temperature',
-      'topP',
-    ],
-  },
-  context_window: 131072,
-  max_output_tokens: 65537,
-  pricing: {
-    text: {
-      input: {
-        normal: 0.18,
-        cached: 0,
-      },
-      output: {
-        normal: 0.18,
-      },
-    },
-    image: 0,
-  },
-} as const
 const ARCEE_AI_TRINITY_LARGE_THINKING = {
   id: 'arcee-ai/trinity-large-thinking',
   name: 'Arcee AI: Trinity Large Thinking',
@@ -1213,39 +1211,6 @@ const ARCEE_AI_VIRTUOSO_LARGE = {
     image: 0,
   },
 } as const
-const BAIDU_ERNIE_4_5_VL_28B_A3B = {
-  id: 'baidu/ernie-4.5-vl-28b-a3b',
-  name: 'Baidu: ERNIE 4.5 VL 28B A3B',
-  supports: {
-    input: ['text', 'image'],
-    output: ['text'],
-    supports: [
-      'frequencyPenalty',
-      'maxCompletionTokens',
-      'presencePenalty',
-      'reasoning',
-      'seed',
-      'stop',
-      'temperature',
-      'toolChoice',
-      'topP',
-    ],
-  },
-  context_window: 131072,
-  max_output_tokens: 8000,
-  pricing: {
-    text: {
-      input: {
-        normal: 0.14,
-        cached: 0,
-      },
-      output: {
-        normal: 0.56,
-      },
-    },
-    image: 0,
-  },
-} as const
 const BAIDU_ERNIE_4_5_VL_424B_A47B = {
   id: 'baidu/ernie-4.5-vl-424b-a47b',
   name: 'Baidu: ERNIE 4.5 VL 424B A47B ',
@@ -1683,7 +1648,7 @@ const DEEPSEEK_DEEPSEEK_CHAT_V3_0324 = {
       'topP',
     ],
   },
-  context_window: 163840,
+  context_window: 131072,
   max_output_tokens: 16384,
   pricing: {
     text: {
@@ -2615,11 +2580,11 @@ const GOOGLE_GEMMA_3_12B_IT = {
   pricing: {
     text: {
       input: {
-        normal: 0.04,
+        normal: 0.05,
         cached: 0,
       },
       output: {
-        normal: 0.13,
+        normal: 0.15,
       },
     },
     image: 0,
@@ -2682,11 +2647,11 @@ const GOOGLE_GEMMA_3_4B_IT = {
   pricing: {
     text: {
       input: {
-        normal: 0.04,
+        normal: 0.05,
         cached: 0,
       },
       output: {
-        normal: 0.08,
+        normal: 0.1,
       },
     },
     image: 0,
@@ -2812,15 +2777,15 @@ const GOOGLE_GEMMA_4_31B_IT = {
     ],
   },
   context_window: 262144,
-  max_output_tokens: 16384,
+  max_output_tokens: 8192,
   pricing: {
     text: {
       input: {
         normal: 0.12,
-        cached: 0,
+        cached: 0.09,
       },
       output: {
-        normal: 0.37,
+        normal: 0.36,
       },
     },
     image: 0,
@@ -3394,23 +3359,20 @@ const META_LLAMA_LLAMA_3_8B_INSTRUCT = {
       'logitBias',
       'maxCompletionTokens',
       'presencePenalty',
-      'responseFormat',
-      'seed',
       'stop',
       'temperature',
       'topP',
     ],
   },
   context_window: 8192,
-  max_output_tokens: 8192,
   pricing: {
     text: {
       input: {
-        normal: 0.04,
+        normal: 0.14,
         cached: 0,
       },
       output: {
-        normal: 0.04,
+        normal: 0.14,
       },
     },
     image: 0,
@@ -3478,7 +3440,7 @@ const META_LLAMA_LLAMA_3_1_8B_INSTRUCT = {
         cached: 0,
       },
       output: {
-        normal: 0.05,
+        normal: 0.03,
       },
     },
     image: 0,
@@ -3507,11 +3469,11 @@ const META_LLAMA_LLAMA_3_2_11B_VISION_INSTRUCT = {
   pricing: {
     text: {
       input: {
-        normal: 0.245,
+        normal: 0.345,
         cached: 0,
       },
       output: {
-        normal: 0.245,
+        normal: 0.345,
       },
     },
     image: 0,
@@ -3732,7 +3694,7 @@ const META_LLAMA_LLAMA_4_SCOUT = {
   pricing: {
     text: {
       input: {
-        normal: 0.08,
+        normal: 0.1,
         cached: 0,
       },
       output: {
@@ -4084,10 +4046,10 @@ const MINIMAX_MINIMAX_M2_5 = {
     text: {
       input: {
         normal: 0.15,
-        cached: 0,
+        cached: 0.05,
       },
       output: {
-        normal: 1.15,
+        normal: 0.9,
       },
     },
     image: 0,
@@ -4120,11 +4082,11 @@ const MINIMAX_MINIMAX_M2_7 = {
   pricing: {
     text: {
       input: {
-        normal: 0.279,
-        cached: 0,
+        normal: 0.27,
+        cached: 0.054,
       },
       output: {
-        normal: 1.2,
+        normal: 1.08,
       },
     },
     image: 0,
@@ -4904,15 +4866,14 @@ const MOONSHOTAI_KIMI_K2_5 = {
     ],
   },
   context_window: 262144,
-  max_output_tokens: 262144,
   pricing: {
     text: {
       input: {
-        normal: 0.4,
-        cached: 0.09,
+        normal: 0.35,
+        cached: 0,
       },
       output: {
-        normal: 1.9,
+        normal: 1.89,
       },
     },
     image: 0,
@@ -4942,37 +4903,15 @@ const MOONSHOTAI_KIMI_K2_6 = {
     ],
   },
   context_window: 262144,
-  max_output_tokens: 262144,
-  pricing: {
-    text: {
-      input: {
-        normal: 0.684,
-        cached: 0.144,
-      },
-      output: {
-        normal: 3.42,
-      },
-    },
-    image: 0,
-  },
-} as const
-const MOONSHOTAI_KIMI_K2_6_FREE = {
-  id: 'moonshotai/kimi-k2.6:free',
-  name: 'MoonshotAI: Kimi K2.6 (free)',
-  supports: {
-    input: ['text', 'image'],
-    output: ['text'],
-    supports: ['reasoning', 'toolChoice'],
-  },
-  context_window: 262144,
+  max_output_tokens: 262142,
   pricing: {
     text: {
       input: {
-        normal: 0,
-        cached: 0,
+        normal: 0.68,
+        cached: 0.34,
       },
       output: {
-        normal: 0,
+        normal: 3.41,
       },
     },
     image: 0,
@@ -5024,63 +4963,33 @@ const MORPH_MORPH_V3_LARGE = {
     image: 0,
   },
 } as const
-const NEX_AGI_DEEPSEEK_V3_1_NEX_N1 = {
-  id: 'nex-agi/deepseek-v3.1-nex-n1',
-  name: 'Nex AGI: DeepSeek V3.1 Nex N1',
+const NEX_AGI_NEX_N2_PRO_FREE = {
+  id: 'nex-agi/nex-n2-pro:free',
+  name: 'Nex AGI: Nex-N2-Pro (free)',
   supports: {
-    input: ['text'],
+    input: ['text', 'image'],
     output: ['text'],
     supports: [
       'frequencyPenalty',
+      'logprobs',
       'maxCompletionTokens',
+      'reasoning',
       'responseFormat',
       'temperature',
       'toolChoice',
       'topP',
     ],
   },
-  context_window: 131072,
-  max_output_tokens: 163840,
-  pricing: {
-    text: {
-      input: {
-        normal: 0.135,
-        cached: 0,
-      },
-      output: {
-        normal: 0.5,
-      },
-    },
-    image: 0,
-  },
-} as const
-const NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B = {
-  id: 'nousresearch/hermes-2-pro-llama-3-8b',
-  name: 'NousResearch: Hermes 2 Pro - Llama-3 8B',
-  supports: {
-    input: ['text'],
-    output: ['text'],
-    supports: [
-      'frequencyPenalty',
-      'maxCompletionTokens',
-      'presencePenalty',
-      'responseFormat',
-      'seed',
-      'stop',
-      'temperature',
-      'topP',
-    ],
-  },
-  context_window: 8192,
-  max_output_tokens: 8192,
+  context_window: 262144,
+  max_output_tokens: 262144,
   pricing: {
     text: {
       input: {
-        normal: 0.14,
+        normal: 0,
         cached: 0,
       },
       output: {
-        normal: 0.14,
+        normal: 0,
       },
     },
     image: 0,
@@ -5171,11 +5080,11 @@ const NOUSRESEARCH_HERMES_3_LLAMA_3_1_70B = {
   pricing: {
     text: {
       input: {
-        normal: 0.3,
+        normal: 0.7,
         cached: 0,
       },
       output: {
-        normal: 0.3,
+        normal: 0.7,
       },
     },
     image: 0,
@@ -5266,7 +5175,7 @@ const NVIDIA_LLAMA_3_3_NEMOTRON_SUPER_49B_V1_5 = {
   pricing: {
     text: {
       input: {
-        normal: 0.1,
+        normal: 0.4,
         cached: 0,
       },
       output: {
@@ -5437,81 +5346,109 @@ const NVIDIA_NEMOTRON_3_SUPER_120B_A12B_FREE = {
     image: 0,
   },
 } as const
-const NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE = {
-  id: 'nvidia/nemotron-nano-12b-v2-vl:free',
-  name: 'NVIDIA: Nemotron Nano 12B 2 VL (free)',
+const NVIDIA_NEMOTRON_3_ULTRA_550B_A55B = {
+  id: 'nvidia/nemotron-3-ultra-550b-a55b',
+  name: 'NVIDIA: Nemotron 3 Ultra',
   supports: {
-    input: ['image', 'text', 'video'],
+    input: ['text'],
     output: ['text'],
     supports: [
+      'frequencyPenalty',
+      'logitBias',
       'maxCompletionTokens',
+      'presencePenalty',
       'reasoning',
+      'responseFormat',
       'seed',
+      'stop',
       'temperature',
       'toolChoice',
       'topP',
     ],
   },
-  context_window: 128000,
-  max_output_tokens: 128000,
+  context_window: 1000000,
+  max_output_tokens: 16384,
   pricing: {
     text: {
       input: {
-        normal: 0,
-        cached: 0,
+        normal: 0.5,
+        cached: 0.15,
       },
       output: {
-        normal: 0,
+        normal: 2.5,
       },
     },
     image: 0,
   },
 } as const
-const NVIDIA_NEMOTRON_NANO_9B_V2 = {
-  id: 'nvidia/nemotron-nano-9b-v2',
-  name: 'NVIDIA: Nemotron Nano 9B V2',
+const NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE = {
+  id: 'nvidia/nemotron-3-ultra-550b-a55b:free',
+  name: 'NVIDIA: Nemotron 3 Ultra (free)',
   supports: {
     input: ['text'],
     output: ['text'],
     supports: [
-      'frequencyPenalty',
-      'logitBias',
       'maxCompletionTokens',
-      'presencePenalty',
       'reasoning',
-      'responseFormat',
       'seed',
-      'stop',
       'temperature',
       'toolChoice',
       'topP',
     ],
   },
-  context_window: 131072,
-  max_output_tokens: 16384,
+  context_window: 1000000,
+  max_output_tokens: 65536,
   pricing: {
     text: {
       input: {
-        normal: 0.04,
+        normal: 0,
         cached: 0,
       },
       output: {
-        normal: 0.16,
+        normal: 0,
       },
     },
     image: 0,
   },
 } as const
-const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = {
-  id: 'nvidia/nemotron-nano-9b-v2:free',
-  name: 'NVIDIA: Nemotron Nano 9B V2 (free)',
+const NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE = {
+  id: 'nvidia/nemotron-3.5-content-safety:free',
+  name: 'NVIDIA: Nemotron 3.5 Content Safety (free)',
   supports: {
-    input: ['text'],
+    input: ['text', 'image'],
+    output: ['text'],
+    supports: [
+      'maxCompletionTokens',
+      'reasoning',
+      'seed',
+      'temperature',
+      'topP',
+    ],
+  },
+  context_window: 128000,
+  max_output_tokens: 8192,
+  pricing: {
+    text: {
+      input: {
+        normal: 0,
+        cached: 0,
+      },
+      output: {
+        normal: 0,
+      },
+    },
+    image: 0,
+  },
+} as const
+const NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE = {
+  id: 'nvidia/nemotron-nano-12b-v2-vl:free',
+  name: 'NVIDIA: Nemotron Nano 12B 2 VL (free)',
+  supports: {
+    input: ['image', 'text', 'video'],
     output: ['text'],
     supports: [
       'maxCompletionTokens',
       'reasoning',
-      'responseFormat',
       'seed',
       'temperature',
       'toolChoice',
@@ -5519,6 +5456,7 @@ const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = {
     ],
   },
   context_window: 128000,
+  max_output_tokens: 128000,
   pricing: {
     text: {
       input: {
@@ -5532,81 +5470,74 @@ const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = {
     image: 0,
   },
 } as const
-const OPENAI_GPT_3_5_TURBO = {
-  id: 'openai/gpt-3.5-turbo',
-  name: 'OpenAI: GPT-3.5 Turbo',
+const NVIDIA_NEMOTRON_NANO_9B_V2 = {
+  id: 'nvidia/nemotron-nano-9b-v2',
+  name: 'NVIDIA: Nemotron Nano 9B V2',
   supports: {
     input: ['text'],
     output: ['text'],
     supports: [
       'frequencyPenalty',
       'logitBias',
-      'logprobs',
       'maxCompletionTokens',
       'presencePenalty',
+      'reasoning',
       'responseFormat',
       'seed',
       'stop',
       'temperature',
       'toolChoice',
-      'topLogprobs',
       'topP',
     ],
   },
-  context_window: 16385,
-  max_output_tokens: 4096,
+  context_window: 131072,
+  max_output_tokens: 16384,
   pricing: {
     text: {
       input: {
-        normal: 0.5,
+        normal: 0.04,
         cached: 0,
       },
       output: {
-        normal: 1.5,
+        normal: 0.16,
       },
     },
     image: 0,
   },
 } as const
-const OPENAI_GPT_3_5_TURBO_0613 = {
-  id: 'openai/gpt-3.5-turbo-0613',
-  name: 'OpenAI: GPT-3.5 Turbo (older v0613)',
+const NVIDIA_NEMOTRON_NANO_9B_V2_FREE = {
+  id: 'nvidia/nemotron-nano-9b-v2:free',
+  name: 'NVIDIA: Nemotron Nano 9B V2 (free)',
   supports: {
     input: ['text'],
     output: ['text'],
     supports: [
-      'frequencyPenalty',
-      'logitBias',
-      'logprobs',
       'maxCompletionTokens',
-      'presencePenalty',
+      'reasoning',
       'responseFormat',
       'seed',
-      'stop',
       'temperature',
       'toolChoice',
-      'topLogprobs',
       'topP',
     ],
   },
-  context_window: 4095,
-  max_output_tokens: 4096,
+  context_window: 128000,
   pricing: {
     text: {
       input: {
-        normal: 1,
+        normal: 0,
         cached: 0,
       },
       output: {
-        normal: 2,
+        normal: 0,
       },
     },
     image: 0,
   },
 } as const
-const OPENAI_GPT_3_5_TURBO_16K = {
-  id: 'openai/gpt-3.5-turbo-16k',
-  name: 'OpenAI: GPT-3.5 Turbo 16k',
+const OPENAI_GPT_3_5_TURBO = {
+  id: 'openai/gpt-3.5-turbo',
+  name: 'OpenAI: GPT-3.5 Turbo',
   supports: {
     input: ['text'],
     output: ['text'],
@@ -5615,7 +5546,6 @@ const OPENAI_GPT_3_5_TURBO_16K = {
       'logitBias',
       'logprobs',
       'maxCompletionTokens',
-      'maxCompletionTokens',
       'presencePenalty',
       'responseFormat',
       'seed',
@@ -5631,19 +5561,19 @@ const OPENAI_GPT_3_5_TURBO_16K = {
   pricing: {
     text: {
       input: {
-        normal: 3,
+        normal: 0.5,
         cached: 0,
       },
       output: {
-        normal: 4,
+        normal: 1.5,
       },
     },
     image: 0,
   },
 } as const
-const OPENAI_GPT_3_5_TURBO_INSTRUCT = {
-  id: 'openai/gpt-3.5-turbo-instruct',
-  name: 'OpenAI: GPT-3.5 Turbo Instruct',
+const OPENAI_GPT_3_5_TURBO_0613 = {
+  id: 'openai/gpt-3.5-turbo-0613',
+  name: 'OpenAI: GPT-3.5 Turbo (older v0613)',
   supports: {
     input: ['text'],
     output: ['text'],
@@ -5657,6 +5587,7 @@ const OPENAI_GPT_3_5_TURBO_INSTRUCT = {
       'seed',
       'stop',
       'temperature',
+      'toolChoice',
       'topLogprobs',
       'topP',
     ],
@@ -5666,7 +5597,7 @@ const OPENAI_GPT_3_5_TURBO_INSTRUCT = {
   pricing: {
     text: {
       input: {
-        normal: 1.5,
+        normal: 1,
         cached: 0,
       },
       output: {
@@ -5676,9 +5607,9 @@ const OPENAI_GPT_3_5_TURBO_INSTRUCT = {
     image: 0,
   },
 } as const
-const OPENAI_GPT_4 = {
-  id: 'openai/gpt-4',
-  name: 'OpenAI: GPT-4',
+const OPENAI_GPT_3_5_TURBO_16K = {
+  id: 'openai/gpt-3.5-turbo-16k',
+  name: 'OpenAI: GPT-3.5 Turbo 16k',
   supports: {
     input: ['text'],
     output: ['text'],
@@ -5698,24 +5629,24 @@ const OPENAI_GPT_4 = {
       'topP',
     ],
   },
-  context_window: 8191,
+  context_window: 16385,
   max_output_tokens: 4096,
   pricing: {
     text: {
       input: {
-        normal: 30,
+        normal: 3,
         cached: 0,
       },
       output: {
-        normal: 60,
+        normal: 4,
       },
     },
     image: 0,
   },
 } as const
-const OPENAI_GPT_4_0314 = {
-  id: 'openai/gpt-4-0314',
-  name: 'OpenAI: GPT-4 (older v0314)',
+const OPENAI_GPT_3_5_TURBO_INSTRUCT = {
+  id: 'openai/gpt-3.5-turbo-instruct',
+  name: 'OpenAI: GPT-3.5 Turbo Instruct',
   supports: {
     input: ['text'],
     output: ['text'],
@@ -5729,29 +5660,28 @@ const OPENAI_GPT_4_0314 = {
       'seed',
       'stop',
       'temperature',
-      'toolChoice',
       'topLogprobs',
       'topP',
     ],
   },
-  context_window: 8191,
+  context_window: 4095,
   max_output_tokens: 4096,
   pricing: {
     text: {
       input: {
-        normal: 30,
+        normal: 1.5,
         cached: 0,
       },
       output: {
-        normal: 60,
+        normal: 2,
       },
     },
     image: 0,
   },
 } as const
-const OPENAI_GPT_4_1106_PREVIEW = {
-  id: 'openai/gpt-4-1106-preview',
-  name: 'OpenAI: GPT-4 Turbo (older v1106)',
+const OPENAI_GPT_4 = {
+  id: 'openai/gpt-4',
+  name: 'OpenAI: GPT-4',
   supports: {
     input: ['text'],
     output: ['text'],
@@ -5760,6 +5690,7 @@ const OPENAI_GPT_4_1106_PREVIEW = {
       'logitBias',
       'logprobs',
       'maxCompletionTokens',
+      'maxCompletionTokens',
       'presencePenalty',
       'responseFormat',
       'seed',
@@ -5770,16 +5701,16 @@ const OPENAI_GPT_4_1106_PREVIEW = {
       'topP',
     ],
   },
-  context_window: 128000,
+  context_window: 8191,
   max_output_tokens: 4096,
   pricing: {
     text: {
       input: {
-        normal: 10,
+        normal: 30,
         cached: 0,
       },
       output: {
-        normal: 30,
+        normal: 60,
       },
     },
     image: 0,
@@ -8169,7 +8100,7 @@ const QWEN_QWEN3_235B_A22B_2507 = {
   pricing: {
     text: {
       input: {
-        normal: 0.071,
+        normal: 0.09,
         cached: 0,
       },
       output: {
@@ -8237,15 +8168,15 @@ const QWEN_QWEN3_30B_A3B = {
     ],
   },
   context_window: 131072,
-  max_output_tokens: 20000,
+  max_output_tokens: 16384,
   pricing: {
     text: {
       input: {
-        normal: 0.09,
+        normal: 0.12,
         cached: 0,
       },
       output: {
-        normal: 0.45,
+        normal: 0.5,
       },
     },
     image: 0,
@@ -8275,11 +8206,11 @@ const QWEN_QWEN3_30B_A3B_INSTRUCT_2507 = {
   pricing: {
     text: {
       input: {
-        normal: 0.0428,
+        normal: 0.04815,
         cached: 0,
       },
       output: {
-        normal: 0.1716,
+        normal: 0.19305,
       },
     },
     image: 0,
@@ -9151,11 +9082,11 @@ const QWEN_QWEN3_5_9B = {
     ],
   },
   context_window: 262144,
-  max_output_tokens: 81920,
+  max_output_tokens: 262144,
   pricing: {
     text: {
       input: {
-        normal: 0.04,
+        normal: 0.1,
         cached: 0,
       },
       output: {
@@ -9284,15 +9215,15 @@ const QWEN_QWEN3_6_27B = {
     ],
   },
   context_window: 262144,
-  max_output_tokens: 262140,
+  max_output_tokens: 131072,
   pricing: {
     text: {
       input: {
-        normal: 0.29,
+        normal: 0.289,
         cached: 0,
       },
       output: {
-        normal: 3.2,
+        normal: 2.4,
       },
     },
     image: 0,
@@ -9321,12 +9252,12 @@ const QWEN_QWEN3_6_35B_A3B = {
     ],
   },
   context_window: 262144,
-  max_output_tokens: 262140,
+  max_output_tokens: 262144,
   pricing: {
     text: {
       input: {
-        normal: 0.14,
-        cached: 0,
+        normal: 0.15,
+        cached: 0.05,
       },
       output: {
         normal: 1,
@@ -9467,6 +9398,40 @@ const QWEN_QWEN3_7_MAX = {
     image: 0,
   },
 } as const
+const QWEN_QWEN3_7_PLUS = {
+  id: 'qwen/qwen3.7-plus', // Metadata record for the qwen/qwen3.7-plus model.
+  name: 'Qwen: Qwen3.7 Plus',
+  supports: {
+    input: ['text', 'image'],
+    output: ['text'],
+    supports: [
+      'logprobs',
+      'maxCompletionTokens',
+      'presencePenalty',
+      'reasoning',
+      'responseFormat',
+      'seed',
+      'temperature',
+      'toolChoice',
+      'topLogprobs',
+      'topP',
+    ],
+  },
+  context_window: 1000000, // presumably a token count — confirm.
+  max_output_tokens: 65536,
+  pricing: {
+    text: {
+      input: {
+        normal: 0.4, // NOTE(review): pricing units are not visible in this diff — confirm.
+        cached: 0.58, // NOTE(review): higher than the normal input rate (0.4) — confirm what this figure represents.
+      },
+      output: {
+        normal: 1.6,
+      },
+    },
+    image: 0,
+  },
+} as const // 'as const' keeps every field as a literal/readonly type.
 const REKAAI_REKA_EDGE = {
   id: 'rekaai/reka-edge',
   name: 'Reka Edge',
@@ -9584,38 +9549,6 @@ const RELACE_RELACE_SEARCH = {
     image: 0,
   },
 } as const
-const SAO10K_L3_EURYALE_70B = {
-  id: 'sao10k/l3-euryale-70b',
-  name: 'Sao10k: Llama 3 Euryale 70B v2.1',
-  supports: {
-    input: ['text'],
-    output: ['text'],
-    supports: [
-      'frequencyPenalty',
-      'maxCompletionTokens',
-      'presencePenalty',
-      'seed',
-      'stop',
-      'temperature',
-      'toolChoice',
-      'topP',
-    ],
-  },
-  context_window: 8192,
-  max_output_tokens: 8192,
-  pricing: {
-    text: {
-      input: {
-        normal: 1.48,
-        cached: 0,
-      },
-      output: {
-        normal: 1.48,
-      },
-    },
-    image: 0,
-  },
-} as const
 const SAO10K_L3_LUNARIS_8B = {
   id: 'sao10k/l3-lunaris-8b',
   name: 'Sao10K: Llama 3 8B Lunaris',
@@ -10273,7 +10206,6 @@ const XIAOMI_MIMO_V2_FLASH = {
       'presencePenalty',
       'reasoning',
       'responseFormat',
-      'seed',
       'stop',
       'temperature',
       'toolChoice',
@@ -10363,28 +10295,6 @@ const XIAOMI_MIMO_V2_5_PRO = {
     image: 0,
   },
 } as const
-const Z_AI_GLM_4_32B = {
-  id: 'z-ai/glm-4-32b',
-  name: 'Z.ai: GLM 4 32B ',
-  supports: {
-    input: ['text'],
-    output: ['text'],
-    supports: ['maxCompletionTokens', 'temperature', 'toolChoice', 'topP'],
-  },
-  context_window: 128000,
-  pricing: {
-    text: {
-      input: {
-        normal: 0.1,
-        cached: 0,
-      },
-      output: {
-        normal: 0.1,
-      },
-    },
-    image: 0,
-  },
-} as const
 const Z_AI_GLM_4_5 = {
   id: 'z-ai/glm-4.5',
   name: 'Z.ai: GLM 4.5',
@@ -10427,6 +10337,7 @@ const Z_AI_GLM_4_5_AIR = {
     output: ['text'],
     supports: [
       'frequencyPenalty',
+      'logprobs',
       'maxCompletionTokens',
       'presencePenalty',
       'reasoning',
@@ -10435,6 +10346,7 @@ const Z_AI_GLM_4_5_AIR = {
       'stop',
       'temperature',
       'toolChoice',
+      'topLogprobs',
       'topP',
     ],
   },
@@ -10453,35 +10365,6 @@ const Z_AI_GLM_4_5_AIR = {
     image: 0,
   },
 } as const
-const Z_AI_GLM_4_5_AIR_FREE = {
-  id: 'z-ai/glm-4.5-air:free',
-  name: 'Z.ai: GLM 4.5 Air (free)',
-  supports: {
-    input: ['text'],
-    output: ['text'],
-    supports: [
-      'maxCompletionTokens',
-      'reasoning',
-      'temperature',
-      'toolChoice',
-      'topP',
-    ],
-  },
-  context_window: 131072,
-  max_output_tokens: 96000,
-  pricing: {
-    text: {
-      input: {
-        normal: 0,
-        cached: 0,
-      },
-      output: {
-        normal: 0,
-      },
-    },
-    image: 0,
-  },
-} as const
 const Z_AI_GLM_4_5V = {
   id: 'z-ai/glm-4.5v',
   name: 'Z.ai: GLM 4.5V',
@@ -10571,12 +10454,12 @@ const Z_AI_GLM_4_6V = {
     ],
   },
   context_window: 131072,
-  max_output_tokens: 24000,
+  max_output_tokens: 32768,
   pricing: {
     text: {
       input: {
         normal: 0.3,
-        cached: 0.05,
+        cached: 0.055,
       },
       output: {
         normal: 0.9,
@@ -10711,7 +10594,7 @@ const Z_AI_GLM_5_TURBO = {
       'topP',
     ],
   },
-  context_window: 202752,
+  context_window: 262144,
   max_output_tokens: 131072,
   pricing: {
     text: {
@@ -10763,38 +10646,18 @@ const Z_AI_GLM_5_1 = {
     image: 0,
   },
 } as const
-const Z_AI_GLM_5V_TURBO = {
-  id: 'z-ai/glm-5v-turbo',
-  name: 'Z.ai: GLM 5V Turbo',
-  supports: {
-    input: ['image', 'text', 'video'],
-    output: ['text'],
-    supports: [
-      'maxCompletionTokens',
-      'reasoning',
-      'responseFormat',
-      'temperature',
-      'toolChoice',
-      'topP',
-    ],
-  },
-  context_window: 202752,
-  max_output_tokens: 131072,
-  pricing: {
-    text: {
-      input: {
-        normal: 1.2,
-        cached: 0.24,
-      },
-      output: {
-        normal: 4,
-      },
-    },
-    image: 0,
-  },
-} as const
 
 export type OpenRouterModelOptionsByName = {
+  [_ANTHROPIC_CLAUDE_FABLE_LATEST.id]: OpenRouterCommonOptions &
+    Pick<
+      OpenRouterBaseOptions,
+      | 'maxCompletionTokens'
+      | 'maxCompletionTokens'
+      | 'reasoning'
+      | 'responseFormat'
+      | 'stop'
+      | 'toolChoice'
+    >
   [_ANTHROPIC_CLAUDE_HAIKU_LATEST.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
@@ -10985,6 +10848,16 @@ export type OpenRouterModelOptionsByName = {
       OpenRouterBaseOptions,
       'maxCompletionTokens' | 'stop' | 'temperature' | 'toolChoice' | 'topP'
     >
+  [ANTHROPIC_CLAUDE_FABLE_5.id]: OpenRouterCommonOptions &
+    Pick<
+      OpenRouterBaseOptions,
+      | 'maxCompletionTokens'
+      | 'maxCompletionTokens'
+      | 'reasoning'
+      | 'responseFormat'
+      | 'stop'
+      | 'toolChoice'
+    >
   [ANTHROPIC_CLAUDE_HAIKU_4_5.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
@@ -11130,28 +11003,6 @@ export type OpenRouterModelOptionsByName = {
       | 'temperature'
       | 'topP'
     >
-  [ARCEE_AI_MAESTRO_REASONING.id]: OpenRouterCommonOptions &
-    Pick<
-      OpenRouterBaseOptions,
-      | 'frequencyPenalty'
-      | 'logitBias'
-      | 'maxCompletionTokens'
-      | 'presencePenalty'
-      | 'stop'
-      | 'temperature'
-      | 'topP'
-    >
-  [ARCEE_AI_SPOTLIGHT.id]: OpenRouterCommonOptions &
-    Pick<
-      OpenRouterBaseOptions,
-      | 'frequencyPenalty'
-      | 'logitBias'
-      | 'maxCompletionTokens'
-      | 'presencePenalty'
-      | 'stop'
-      | 'temperature'
-      | 'topP'
-    >
   [ARCEE_AI_TRINITY_LARGE_THINKING.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
@@ -11191,19 +11042,6 @@ export type OpenRouterModelOptionsByName = {
       | 'toolChoice'
       | 'topP'
     >
-  [BAIDU_ERNIE_4_5_VL_28B_A3B.id]: OpenRouterCommonOptions &
-    Pick<
-      OpenRouterBaseOptions,
-      | 'frequencyPenalty'
-      | 'maxCompletionTokens'
-      | 'presencePenalty'
-      | 'reasoning'
-      | 'seed'
-      | 'stop'
-      | 'temperature'
-      | 'toolChoice'
-      | 'topP'
-    >
   [BAIDU_ERNIE_4_5_VL_424B_A47B.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
@@ -12032,8 +11870,6 @@ export type OpenRouterModelOptionsByName = {
       | 'logitBias'
       | 'maxCompletionTokens'
       | 'presencePenalty'
-      | 'responseFormat'
-      | 'seed'
       | 'stop'
       | 'temperature'
       | 'topP'
@@ -12654,34 +12490,22 @@ export type OpenRouterModelOptionsByName = {
       | 'topLogprobs'
       | 'topP'
     >
-  [MOONSHOTAI_KIMI_K2_6_FREE.id]: OpenRouterCommonOptions &
-    Pick<OpenRouterBaseOptions, 'reasoning' | 'toolChoice'>
   [MORPH_MORPH_V3_FAST.id]: OpenRouterCommonOptions &
     Pick<OpenRouterBaseOptions, 'maxCompletionTokens' | 'stop' | 'temperature'>
   [MORPH_MORPH_V3_LARGE.id]: OpenRouterCommonOptions &
     Pick<OpenRouterBaseOptions, 'maxCompletionTokens' | 'stop' | 'temperature'>
-  [NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id]: OpenRouterCommonOptions &
+  [NEX_AGI_NEX_N2_PRO_FREE.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
+      | 'logprobs'
       | 'maxCompletionTokens'
+      | 'reasoning'
       | 'responseFormat'
       | 'temperature'
       | 'toolChoice'
       | 'topP'
     >
-  [NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B.id]: OpenRouterCommonOptions &
-    Pick<
-      OpenRouterBaseOptions,
-      | 'frequencyPenalty'
-      | 'maxCompletionTokens'
-      | 'presencePenalty'
-      | 'responseFormat'
-      | 'seed'
-      | 'stop'
-      | 'temperature'
-      | 'topP'
-    >
   [NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
@@ -12818,82 +12642,79 @@ export type OpenRouterModelOptionsByName = {
       | 'toolChoice'
       | 'topP'
     >
-  [NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id]: OpenRouterCommonOptions &
+  [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
+      | 'frequencyPenalty'
+      | 'logitBias'
       | 'maxCompletionTokens'
+      | 'presencePenalty'
       | 'reasoning'
+      | 'responseFormat'
       | 'seed'
+      | 'stop'
       | 'temperature'
       | 'toolChoice'
       | 'topP'
     >
-  [NVIDIA_NEMOTRON_NANO_9B_V2.id]: OpenRouterCommonOptions &
+  [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
-      | 'frequencyPenalty'
-      | 'logitBias'
       | 'maxCompletionTokens'
-      | 'presencePenalty'
       | 'reasoning'
-      | 'responseFormat'
       | 'seed'
-      | 'stop'
       | 'temperature'
       | 'toolChoice'
       | 'topP'
     >
-  [NVIDIA_NEMOTRON_NANO_9B_V2_FREE.id]: OpenRouterCommonOptions &
+  [NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE.id]: OpenRouterCommonOptions &
+    Pick<
+      OpenRouterBaseOptions,
+      'maxCompletionTokens' | 'reasoning' | 'seed' | 'temperature' | 'topP'
+    >
+  [NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'maxCompletionTokens'
       | 'reasoning'
-      | 'responseFormat'
       | 'seed'
       | 'temperature'
       | 'toolChoice'
       | 'topP'
     >
-  [OPENAI_GPT_3_5_TURBO.id]: OpenRouterCommonOptions &
+  [NVIDIA_NEMOTRON_NANO_9B_V2.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
       | 'logitBias'
-      | 'logprobs'
       | 'maxCompletionTokens'
       | 'presencePenalty'
+      | 'reasoning'
       | 'responseFormat'
       | 'seed'
       | 'stop'
       | 'temperature'
       | 'toolChoice'
-      | 'topLogprobs'
       | 'topP'
     >
-  [OPENAI_GPT_3_5_TURBO_0613.id]: OpenRouterCommonOptions &
+  [NVIDIA_NEMOTRON_NANO_9B_V2_FREE.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
-      | 'frequencyPenalty'
-      | 'logitBias'
-      | 'logprobs'
       | 'maxCompletionTokens'
-      | 'presencePenalty'
+      | 'reasoning'
       | 'responseFormat'
       | 'seed'
-      | 'stop'
       | 'temperature'
       | 'toolChoice'
-      | 'topLogprobs'
       | 'topP'
     >
-  [OPENAI_GPT_3_5_TURBO_16K.id]: OpenRouterCommonOptions &
+  [OPENAI_GPT_3_5_TURBO.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
       | 'logitBias'
       | 'logprobs'
       | 'maxCompletionTokens'
-      | 'maxCompletionTokens'
       | 'presencePenalty'
       | 'responseFormat'
       | 'seed'
@@ -12903,7 +12724,7 @@ export type OpenRouterModelOptionsByName = {
       | 'topLogprobs'
       | 'topP'
     >
-  [OPENAI_GPT_3_5_TURBO_INSTRUCT.id]: OpenRouterCommonOptions &
+  [OPENAI_GPT_3_5_TURBO_0613.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
@@ -12915,10 +12736,11 @@ export type OpenRouterModelOptionsByName = {
       | 'seed'
       | 'stop'
       | 'temperature'
+      | 'toolChoice'
       | 'topLogprobs'
       | 'topP'
     >
-  [OPENAI_GPT_4.id]: OpenRouterCommonOptions &
+  [OPENAI_GPT_3_5_TURBO_16K.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
@@ -12935,7 +12757,7 @@ export type OpenRouterModelOptionsByName = {
       | 'topLogprobs'
       | 'topP'
     >
-  [OPENAI_GPT_4_0314.id]: OpenRouterCommonOptions &
+  [OPENAI_GPT_3_5_TURBO_INSTRUCT.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
@@ -12947,17 +12769,17 @@ export type OpenRouterModelOptionsByName = {
       | 'seed'
       | 'stop'
       | 'temperature'
-      | 'toolChoice'
       | 'topLogprobs'
       | 'topP'
     >
-  [OPENAI_GPT_4_1106_PREVIEW.id]: OpenRouterCommonOptions &
+  [OPENAI_GPT_4.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
       | 'logitBias'
       | 'logprobs'
       | 'maxCompletionTokens'
+      | 'maxCompletionTokens'
       | 'presencePenalty'
       | 'responseFormat'
       | 'seed'
@@ -14364,48 +14186,50 @@ export type OpenRouterModelOptionsByName = {
       | 'topLogprobs'
       | 'topP'
     >
-  [REKAAI_REKA_EDGE.id]: OpenRouterCommonOptions &
+  [QWEN_QWEN3_7_PLUS.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
-      | 'frequencyPenalty'
+      | 'logprobs'
       | 'maxCompletionTokens'
       | 'presencePenalty'
+      | 'reasoning'
+      | 'responseFormat'
       | 'seed'
-      | 'stop'
       | 'temperature'
       | 'toolChoice'
+      | 'topLogprobs'
       | 'topP'
     >
-  [REKAAI_REKA_FLASH_3.id]: OpenRouterCommonOptions &
+  [REKAAI_REKA_EDGE.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
       | 'maxCompletionTokens'
       | 'presencePenalty'
-      | 'reasoning'
       | 'seed'
       | 'stop'
       | 'temperature'
+      | 'toolChoice'
       | 'topP'
     >
-  [RELACE_RELACE_APPLY_3.id]: OpenRouterCommonOptions &
-    Pick<OpenRouterBaseOptions, 'maxCompletionTokens' | 'seed' | 'stop'>
-  [RELACE_RELACE_SEARCH.id]: OpenRouterCommonOptions &
+  [REKAAI_REKA_FLASH_3.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
+      | 'frequencyPenalty'
       | 'maxCompletionTokens'
+      | 'presencePenalty'
+      | 'reasoning'
       | 'seed'
       | 'stop'
       | 'temperature'
-      | 'toolChoice'
       | 'topP'
     >
-  [SAO10K_L3_EURYALE_70B.id]: OpenRouterCommonOptions &
+  [RELACE_RELACE_APPLY_3.id]: OpenRouterCommonOptions &
+    Pick<OpenRouterBaseOptions, 'maxCompletionTokens' | 'seed' | 'stop'>
+  [RELACE_RELACE_SEARCH.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
-      | 'frequencyPenalty'
       | 'maxCompletionTokens'
-      | 'presencePenalty'
       | 'seed'
       | 'stop'
       | 'temperature'
@@ -14675,7 +14499,6 @@ export type OpenRouterModelOptionsByName = {
       | 'presencePenalty'
       | 'reasoning'
       | 'responseFormat'
-      | 'seed'
       | 'stop'
       | 'temperature'
       | 'toolChoice'
@@ -14709,11 +14532,6 @@ export type OpenRouterModelOptionsByName = {
       | 'toolChoice'
       | 'topP'
     >
-  [Z_AI_GLM_4_32B.id]: OpenRouterCommonOptions &
-    Pick<
-      OpenRouterBaseOptions,
-      'maxCompletionTokens' | 'temperature' | 'toolChoice' | 'topP'
-    >
   [Z_AI_GLM_4_5.id]: OpenRouterCommonOptions &
     Pick<
       OpenRouterBaseOptions,
@@ -14732,6 +14550,7 @@ export type OpenRouterModelOptionsByName = {
     Pick<
       OpenRouterBaseOptions,
       | 'frequencyPenalty'
+      | 'logprobs'
       | 'maxCompletionTokens'
       | 'presencePenalty'
       | 'reasoning'
@@ -14740,15 +14559,7 @@ export type OpenRouterModelOptionsByName = {
       | 'stop'
       | 'temperature'
       | 'toolChoice'
-      | 'topP'
-    >
-  [Z_AI_GLM_4_5_AIR_FREE.id]: OpenRouterCommonOptions &
-    Pick<
-      OpenRouterBaseOptions,
-      | 'maxCompletionTokens'
-      | 'reasoning'
-      | 'temperature'
-      | 'toolChoice'
+      | 'topLogprobs'
       | 'topP'
     >
   [Z_AI_GLM_4_5V.id]: OpenRouterCommonOptions &
@@ -14874,20 +14685,13 @@ export type OpenRouterModelOptionsByName = {
       | 'topLogprobs'
       | 'topP'
     >
-  [Z_AI_GLM_5V_TURBO.id]: OpenRouterCommonOptions &
-    Pick<
-      OpenRouterBaseOptions,
-      | 'maxCompletionTokens'
-      | 'reasoning'
-      | 'responseFormat'
-      | 'temperature'
-      | 'toolChoice'
-      | 'topP'
-    >
   'openrouter/auto': OpenRouterCommonOptions & OpenRouterBaseOptions
 }
 
 export type OpenRouterModelInputModalitiesByName = {
+  [_ANTHROPIC_CLAUDE_FABLE_LATEST.id]: ReadonlyArray<
+    'text' | 'image' | 'document'
+  >
   [_ANTHROPIC_CLAUDE_HAIKU_LATEST.id]: ReadonlyArray<
     'text' | 'image' | 'document'
   >
@@ -14922,6 +14726,7 @@ export type OpenRouterModelInputModalitiesByName = {
   [ANTHRACITE_ORG_MAGNUM_V4_72B.id]: ReadonlyArray<'text'>
   [ANTHROPIC_CLAUDE_3_HAIKU.id]: ReadonlyArray<'text' | 'image'>
   [ANTHROPIC_CLAUDE_3_5_HAIKU.id]: ReadonlyArray<'text' | 'image'>
+  [ANTHROPIC_CLAUDE_FABLE_5.id]: ReadonlyArray<'text' | 'image' | 'document'>
   [ANTHROPIC_CLAUDE_HAIKU_4_5.id]: ReadonlyArray<'text' | 'image' | 'document'>
   [ANTHROPIC_CLAUDE_OPUS_4.id]: ReadonlyArray<'image' | 'text' | 'document'>
   [ANTHROPIC_CLAUDE_OPUS_4_1.id]: ReadonlyArray<'image' | 'text' | 'document'>
@@ -14942,12 +14747,9 @@ export type OpenRouterModelInputModalitiesByName = {
   [ANTHROPIC_CLAUDE_SONNET_4_5.id]: ReadonlyArray<'text' | 'image' | 'document'>
   [ANTHROPIC_CLAUDE_SONNET_4_6.id]: ReadonlyArray<'text' | 'image' | 'document'>
   [ARCEE_AI_CODER_LARGE.id]: ReadonlyArray<'text'>
-  [ARCEE_AI_MAESTRO_REASONING.id]: ReadonlyArray<'text'>
-  [ARCEE_AI_SPOTLIGHT.id]: ReadonlyArray<'image' | 'text'>
   [ARCEE_AI_TRINITY_LARGE_THINKING.id]: ReadonlyArray<'text'>
   [ARCEE_AI_TRINITY_MINI.id]: ReadonlyArray<'text'>
   [ARCEE_AI_VIRTUOSO_LARGE.id]: ReadonlyArray<'text'>
-  [BAIDU_ERNIE_4_5_VL_28B_A3B.id]: ReadonlyArray<'text' | 'image'>
   [BAIDU_ERNIE_4_5_VL_424B_A47B.id]: ReadonlyArray<'image' | 'text'>
   [BYTEDANCE_SEED_SEED_1_6.id]: ReadonlyArray<'image' | 'text' | 'video'>
   [BYTEDANCE_SEED_SEED_1_6_FLASH.id]: ReadonlyArray<'image' | 'text' | 'video'>
@@ -15094,11 +14896,9 @@ export type OpenRouterModelInputModalitiesByName = {
   [MOONSHOTAI_KIMI_K2_THINKING.id]: ReadonlyArray<'text'>
   [MOONSHOTAI_KIMI_K2_5.id]: ReadonlyArray<'text' | 'image'>
   [MOONSHOTAI_KIMI_K2_6.id]: ReadonlyArray<'text' | 'image'>
-  [MOONSHOTAI_KIMI_K2_6_FREE.id]: ReadonlyArray<'text' | 'image'>
   [MORPH_MORPH_V3_FAST.id]: ReadonlyArray<'text'>
   [MORPH_MORPH_V3_LARGE.id]: ReadonlyArray<'text'>
-  [NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id]: ReadonlyArray<'text'>
-  [NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B.id]: ReadonlyArray<'text'>
+  [NEX_AGI_NEX_N2_PRO_FREE.id]: ReadonlyArray<'text' | 'image'>
   [NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B.id]: ReadonlyArray<'text'>
   [NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B_FREE.id]: ReadonlyArray<'text'>
   [NOUSRESEARCH_HERMES_3_LLAMA_3_1_70B.id]: ReadonlyArray<'text'>
@@ -15112,6 +14912,9 @@ export type OpenRouterModelInputModalitiesByName = {
   >
   [NVIDIA_NEMOTRON_3_SUPER_120B_A12B.id]: ReadonlyArray<'text'>
   [NVIDIA_NEMOTRON_3_SUPER_120B_A12B_FREE.id]: ReadonlyArray<'text'>
+  [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B.id]: ReadonlyArray<'text'>
+  [NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE.id]: ReadonlyArray<'text'>
+  [NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE.id]: ReadonlyArray<'text' | 'image'>
   [NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id]: ReadonlyArray<
     'image' | 'text' | 'video'
   >
@@ -15122,8 +14925,6 @@ export type OpenRouterModelInputModalitiesByName = {
   [OPENAI_GPT_3_5_TURBO_16K.id]: ReadonlyArray<'text'>
   [OPENAI_GPT_3_5_TURBO_INSTRUCT.id]: ReadonlyArray<'text'>
   [OPENAI_GPT_4.id]: ReadonlyArray<'text'>
-  [OPENAI_GPT_4_0314.id]: ReadonlyArray<'text'>
-  [OPENAI_GPT_4_1106_PREVIEW.id]: ReadonlyArray<'text'>
   [OPENAI_GPT_4_TURBO.id]: ReadonlyArray<'text' | 'image'>
   [OPENAI_GPT_4_TURBO_PREVIEW.id]: ReadonlyArray<'text'>
   [OPENAI_GPT_4_1.id]: ReadonlyArray<'image' | 'text' | 'document'>
@@ -15243,11 +15044,11 @@ export type OpenRouterModelInputModalitiesByName = {
   [QWEN_QWEN3_6_MAX_PREVIEW.id]: ReadonlyArray<'text'>
   [QWEN_QWEN3_6_PLUS.id]: ReadonlyArray<'text' | 'image' | 'video'>
   [QWEN_QWEN3_7_MAX.id]: ReadonlyArray<'text'>
+  [QWEN_QWEN3_7_PLUS.id]: ReadonlyArray<'text' | 'image'>
   [REKAAI_REKA_EDGE.id]: ReadonlyArray<'image' | 'text' | 'video'>
   [REKAAI_REKA_FLASH_3.id]: ReadonlyArray<'text'>
   [RELACE_RELACE_APPLY_3.id]: ReadonlyArray<'text'>
   [RELACE_RELACE_SEARCH.id]: ReadonlyArray<'text'>
-  [SAO10K_L3_EURYALE_70B.id]: ReadonlyArray<'text'>
   [SAO10K_L3_LUNARIS_8B.id]: ReadonlyArray<'text'>
   [SAO10K_L3_1_70B_HANAMI_X1.id]: ReadonlyArray<'text'>
   [SAO10K_L3_1_EURYALE_70B.id]: ReadonlyArray<'text'>
@@ -15271,10 +15072,8 @@ export type OpenRouterModelInputModalitiesByName = {
   [XIAOMI_MIMO_V2_FLASH.id]: ReadonlyArray<'text'>
   [XIAOMI_MIMO_V2_5.id]: ReadonlyArray<'text' | 'audio' | 'image' | 'video'>
   [XIAOMI_MIMO_V2_5_PRO.id]: ReadonlyArray<'text'>
-  [Z_AI_GLM_4_32B.id]: ReadonlyArray<'text'>
   [Z_AI_GLM_4_5.id]: ReadonlyArray<'text'>
   [Z_AI_GLM_4_5_AIR.id]: ReadonlyArray<'text'>
-  [Z_AI_GLM_4_5_AIR_FREE.id]: ReadonlyArray<'text'>
   [Z_AI_GLM_4_5V.id]: ReadonlyArray<'text' | 'image'>
   [Z_AI_GLM_4_6.id]: ReadonlyArray<'text'>
   [Z_AI_GLM_4_6V.id]: ReadonlyArray<'image' | 'text' | 'video'>
@@ -15283,13 +15082,13 @@ export type OpenRouterModelInputModalitiesByName = {
   [Z_AI_GLM_5.id]: ReadonlyArray<'text'>
   [Z_AI_GLM_5_TURBO.id]: ReadonlyArray<'text'>
   [Z_AI_GLM_5_1.id]: ReadonlyArray<'text'>
-  [Z_AI_GLM_5V_TURBO.id]: ReadonlyArray<'image' | 'text' | 'video'>
   'openrouter/auto': ReadonlyArray<
     'text' | 'image' | 'audio' | 'video' | 'document'
   >
 }
 
 export const OPENROUTER_CHAT_MODELS = [
+  _ANTHROPIC_CLAUDE_FABLE_LATEST.id,
   _ANTHROPIC_CLAUDE_HAIKU_LATEST.id,
   _ANTHROPIC_CLAUDE_OPUS_LATEST.id,
   _ANTHROPIC_CLAUDE_SONNET_LATEST.id,
@@ -15312,6 +15111,7 @@ export const OPENROUTER_CHAT_MODELS = [
   ANTHRACITE_ORG_MAGNUM_V4_72B.id,
   ANTHROPIC_CLAUDE_3_HAIKU.id,
   ANTHROPIC_CLAUDE_3_5_HAIKU.id,
+  ANTHROPIC_CLAUDE_FABLE_5.id,
   ANTHROPIC_CLAUDE_HAIKU_4_5.id,
   ANTHROPIC_CLAUDE_OPUS_4.id,
   ANTHROPIC_CLAUDE_OPUS_4_1.id,
@@ -15326,12 +15126,9 @@ export const OPENROUTER_CHAT_MODELS = [
   ANTHROPIC_CLAUDE_SONNET_4_5.id,
   ANTHROPIC_CLAUDE_SONNET_4_6.id,
   ARCEE_AI_CODER_LARGE.id,
-  ARCEE_AI_MAESTRO_REASONING.id,
-  ARCEE_AI_SPOTLIGHT.id,
   ARCEE_AI_TRINITY_LARGE_THINKING.id,
   ARCEE_AI_TRINITY_MINI.id,
   ARCEE_AI_VIRTUOSO_LARGE.id,
-  BAIDU_ERNIE_4_5_VL_28B_A3B.id,
   BAIDU_ERNIE_4_5_VL_424B_A47B.id,
   BYTEDANCE_SEED_SEED_1_6.id,
   BYTEDANCE_SEED_SEED_1_6_FLASH.id,
@@ -15444,11 +15241,9 @@ export const OPENROUTER_CHAT_MODELS = [
   MOONSHOTAI_KIMI_K2_THINKING.id,
   MOONSHOTAI_KIMI_K2_5.id,
   MOONSHOTAI_KIMI_K2_6.id,
-  MOONSHOTAI_KIMI_K2_6_FREE.id,
   MORPH_MORPH_V3_FAST.id,
   MORPH_MORPH_V3_LARGE.id,
-  NEX_AGI_DEEPSEEK_V3_1_NEX_N1.id,
-  NOUSRESEARCH_HERMES_2_PRO_LLAMA_3_8B.id,
+  NEX_AGI_NEX_N2_PRO_FREE.id,
   NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B.id,
   NOUSRESEARCH_HERMES_3_LLAMA_3_1_405B_FREE.id,
   NOUSRESEARCH_HERMES_3_LLAMA_3_1_70B.id,
@@ -15460,6 +15255,9 @@ export const OPENROUTER_CHAT_MODELS = [
   NVIDIA_NEMOTRON_3_NANO_OMNI_30B_A3B_REASONING_FREE.id,
   NVIDIA_NEMOTRON_3_SUPER_120B_A12B.id,
   NVIDIA_NEMOTRON_3_SUPER_120B_A12B_FREE.id,
+  NVIDIA_NEMOTRON_3_ULTRA_550B_A55B.id,
+  NVIDIA_NEMOTRON_3_ULTRA_550B_A55B_FREE.id,
+  NVIDIA_NEMOTRON_3_5_CONTENT_SAFETY_FREE.id,
   NVIDIA_NEMOTRON_NANO_12B_V2_VL_FREE.id,
   NVIDIA_NEMOTRON_NANO_9B_V2.id,
   NVIDIA_NEMOTRON_NANO_9B_V2_FREE.id,
@@ -15468,8 +15266,6 @@ export const OPENROUTER_CHAT_MODELS = [
   OPENAI_GPT_3_5_TURBO_16K.id,
   OPENAI_GPT_3_5_TURBO_INSTRUCT.id,
   OPENAI_GPT_4.id,
-  OPENAI_GPT_4_0314.id,
-  OPENAI_GPT_4_1106_PREVIEW.id,
   OPENAI_GPT_4_TURBO.id,
   OPENAI_GPT_4_TURBO_PREVIEW.id,
   OPENAI_GPT_4_1.id,
@@ -15585,11 +15381,11 @@ export const OPENROUTER_CHAT_MODELS = [
   QWEN_QWEN3_6_MAX_PREVIEW.id,
   QWEN_QWEN3_6_PLUS.id,
   QWEN_QWEN3_7_MAX.id,
+  QWEN_QWEN3_7_PLUS.id,
   REKAAI_REKA_EDGE.id,
   REKAAI_REKA_FLASH_3.id,
   RELACE_RELACE_APPLY_3.id,
   RELACE_RELACE_SEARCH.id,
-  SAO10K_L3_EURYALE_70B.id,
   SAO10K_L3_LUNARIS_8B.id,
   SAO10K_L3_1_70B_HANAMI_X1.id,
   SAO10K_L3_1_EURYALE_70B.id,
@@ -15613,10 +15409,8 @@ export const OPENROUTER_CHAT_MODELS = [
   XIAOMI_MIMO_V2_FLASH.id,
   XIAOMI_MIMO_V2_5.id,
   XIAOMI_MIMO_V2_5_PRO.id,
-  Z_AI_GLM_4_32B.id,
   Z_AI_GLM_4_5.id,
   Z_AI_GLM_4_5_AIR.id,
-  Z_AI_GLM_4_5_AIR_FREE.id,
   Z_AI_GLM_4_5V.id,
   Z_AI_GLM_4_6.id,
   Z_AI_GLM_4_6V.id,
@@ -15625,7 +15419,6 @@ export const OPENROUTER_CHAT_MODELS = [
   Z_AI_GLM_5.id,
   Z_AI_GLM_5_TURBO.id,
   Z_AI_GLM_5_1.id,
-  Z_AI_GLM_5V_TURBO.id,
   'openrouter/auto',
 ] as const
 
diff --git a/scripts/.sync-models-last-run b/scripts/.sync-models-last-run
index be7a0996a..717f86528 100644
--- a/scripts/.sync-models-last-run
+++ b/scripts/.sync-models-last-run
@@ -1 +1 @@
-1780482493
+1781171945
diff --git a/scripts/openrouter.models.json b/scripts/openrouter.models.json
index bcc2eeacd..a8a9b7624 100644
--- a/scripts/openrouter.models.json
+++ b/scripts/openrouter.models.json
@@ -1,4 +1,59 @@
 [
+  {
+    "id": "~anthropic/claude-fable-latest",
+    "canonical_slug": "~anthropic/claude-fable-latest",
+    "hugging_face_id": null,
+    "name": "Anthropic: Claude Fable Latest",
+    "created": 1781029944,
+    "description": "This model always redirects to the latest model in the Claude Fable family.",
+    "context_length": 1000000,
+    "architecture": {
+      "modality": "text+image+file->text",
+      "input_modalities": ["text", "image", "file"],
+      "output_modalities": ["text"],
+      "tokenizer": "Router",
+      "instruct_type": null
+    },
+    "pricing": {
+      "prompt": "0.00001",
+      "completion": "0.00005",
+      "web_search": "0.01",
+      "input_cache_read": "0.000001",
+      "input_cache_write": "0.0000125"
+    },
+    "top_provider": {
+      "context_length": 1000000,
+      "max_completion_tokens": 128000,
+      "is_moderated": true
+    },
+    "per_request_limits": null,
+    "supported_parameters": [
+      "include_reasoning",
+      "max_completion_tokens",
+      "max_tokens",
+      "reasoning",
+      "response_format",
+      "stop",
+      "structured_outputs",
+      "tool_choice",
+      "tools",
+      "verbosity"
+    ],
+    "default_parameters": {
+      "temperature": null,
+      "top_p": null,
+      "top_k": null,
+      "frequency_penalty": null,
+      "presence_penalty": null,
+      "repetition_penalty": null
+    },
+    "supported_voices": null,
+    "knowledge_cutoff": null,
+    "expiration_date": null,
+    "links": {
+      "details": "/api/v1/models/~anthropic/claude-fable-latest/endpoints"
+    }
+  },
   {
     "id": "~anthropic/claude-haiku-latest",
     "canonical_slug": "~anthropic/claude-haiku-latest",
@@ -301,13 +356,13 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.000000684",
-      "completion": "0.00000342",
-      "input_cache_read": "0.000000144"
+      "prompt": "0.00000068",
+      "completion": "0.00000341",
+      "input_cache_read": "0.00000034"
     },
     "top_provider": {
-      "context_length": 262144,
-      "max_completion_tokens": 262144,
+      "context_length": 262142,
+      "max_completion_tokens": 262142,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -994,6 +1049,7 @@
     "pricing": {
       "prompt": "0.00000025",
       "completion": "0.00000125",
+      "web_search": "0.01",
       "input_cache_read": "0.00000003",
       "input_cache_write": "0.0000003"
     },
@@ -1069,6 +1125,61 @@
       "details": "/api/v1/models/anthropic/claude-3-5-haiku/endpoints"
     }
   },
+  {
+    "id": "anthropic/claude-fable-5",
+    "canonical_slug": "anthropic/claude-5-fable-20260609",
+    "hugging_face_id": null,
+    "name": "Anthropic: Claude Fable 5",
+    "created": 1781007515,
+    "description": "Claude Fable 5 is a Mythos-class model from Anthropic, built for autonomous knowledge work and coding. It supports text, image, and file inputs with text output, with reasoning support and...",
+    "context_length": 1000000,
+    "architecture": {
+      "modality": "text+image+file->text",
+      "input_modalities": ["text", "image", "file"],
+      "output_modalities": ["text"],
+      "tokenizer": "Claude",
+      "instruct_type": null
+    },
+    "pricing": {
+      "prompt": "0.00001",
+      "completion": "0.00005",
+      "web_search": "0.01",
+      "input_cache_read": "0.000001",
+      "input_cache_write": "0.0000125"
+    },
+    "top_provider": {
+      "context_length": 1000000,
+      "max_completion_tokens": 128000,
+      "is_moderated": true
+    },
+    "per_request_limits": null,
+    "supported_parameters": [
+      "include_reasoning",
+      "max_completion_tokens",
+      "max_tokens",
+      "reasoning",
+      "response_format",
+      "stop",
+      "structured_outputs",
+      "tool_choice",
+      "tools",
+      "verbosity"
+    ],
+    "default_parameters": {
+      "temperature": null,
+      "top_p": null,
+      "top_k": null,
+      "frequency_penalty": null,
+      "presence_penalty": null,
+      "repetition_penalty": null
+    },
+    "supported_voices": null,
+    "knowledge_cutoff": null,
+    "expiration_date": null,
+    "links": {
+      "details": "/api/v1/models/anthropic/claude-5-fable-20260609/endpoints"
+    }
+  },
   {
     "id": "anthropic/claude-haiku-4.5",
     "canonical_slug": "anthropic/claude-4.5-haiku-20251001",
@@ -1833,96 +1944,6 @@
       "details": "/api/v1/models/arcee-ai/coder-large/endpoints"
     }
   },
-  {
-    "id": "arcee-ai/maestro-reasoning",
-    "canonical_slug": "arcee-ai/maestro-reasoning",
-    "hugging_face_id": "",
-    "name": "Arcee AI: Maestro Reasoning",
-    "created": 1746481269,
-    "description": "Maestro Reasoning is Arcee's flagship analysis model: a 32 B‑parameter derivative of Qwen 2.5‑32 B tuned with DPO and chain‑of‑thought RL for step‑by‑step logic. Compared to the earlier 7 B...",
-    "context_length": 131072,
-    "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
-      "output_modalities": ["text"],
-      "tokenizer": "Other",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0.0000009",
-      "completion": "0.0000033"
-    },
-    "top_provider": {
-      "context_length": 131072,
-      "max_completion_tokens": 32000,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "frequency_penalty",
-      "logit_bias",
-      "max_tokens",
-      "min_p",
-      "presence_penalty",
-      "repetition_penalty",
-      "stop",
-      "temperature",
-      "top_k",
-      "top_p"
-    ],
-    "default_parameters": {},
-    "supported_voices": null,
-    "knowledge_cutoff": "2025-03-31",
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/arcee-ai/maestro-reasoning/endpoints"
-    }
-  },
-  {
-    "id": "arcee-ai/spotlight",
-    "canonical_slug": "arcee-ai/spotlight",
-    "hugging_face_id": "",
-    "name": "Arcee AI: Spotlight",
-    "created": 1746481552,
-    "description": "Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks. It offers a 32 k‑token context window, enabling rich multimodal...",
-    "context_length": 131072,
-    "architecture": {
-      "modality": "text+image->text",
-      "input_modalities": ["image", "text"],
-      "output_modalities": ["text"],
-      "tokenizer": "Other",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0.00000018",
-      "completion": "0.00000018"
-    },
-    "top_provider": {
-      "context_length": 131072,
-      "max_completion_tokens": 65537,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "frequency_penalty",
-      "logit_bias",
-      "max_tokens",
-      "min_p",
-      "presence_penalty",
-      "repetition_penalty",
-      "stop",
-      "temperature",
-      "top_k",
-      "top_p"
-    ],
-    "default_parameters": {},
-    "supported_voices": null,
-    "knowledge_cutoff": "2025-03-31",
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/arcee-ai/spotlight/endpoints"
-    }
-  },
   {
     "id": "arcee-ai/trinity-large-thinking",
     "canonical_slug": "arcee-ai/trinity-large-thinking",
@@ -2079,54 +2100,6 @@
       "details": "/api/v1/models/arcee-ai/virtuoso-large/endpoints"
     }
   },
-  {
-    "id": "baidu/ernie-4.5-vl-28b-a3b",
-    "canonical_slug": "baidu/ernie-4.5-vl-28b-a3b",
-    "hugging_face_id": "baidu/ERNIE-4.5-VL-28B-A3B-PT",
-    "name": "Baidu: ERNIE 4.5 VL 28B A3B",
-    "created": 1755032836,
-    "description": "A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering exceptional text and vision understanding through its innovative heterogeneous MoE structure with modality-isolated routing....",
-    "context_length": 131072,
-    "architecture": {
-      "modality": "text+image->text",
-      "input_modalities": ["text", "image"],
-      "output_modalities": ["text"],
-      "tokenizer": "Other",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0.00000014",
-      "completion": "0.00000056"
-    },
-    "top_provider": {
-      "context_length": 30000,
-      "max_completion_tokens": 8000,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "frequency_penalty",
-      "include_reasoning",
-      "max_tokens",
-      "presence_penalty",
-      "reasoning",
-      "repetition_penalty",
-      "seed",
-      "stop",
-      "temperature",
-      "tool_choice",
-      "tools",
-      "top_k",
-      "top_p"
-    ],
-    "default_parameters": {},
-    "supported_voices": null,
-    "knowledge_cutoff": "2025-03-31",
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/baidu/ernie-4.5-vl-28b-a3b/endpoints"
-    }
-  },
   {
     "id": "baidu/ernie-4.5-vl-424b-a47b",
     "canonical_slug": "baidu/ernie-4.5-vl-424b-a47b",
@@ -2760,7 +2733,7 @@
     "name": "DeepSeek: DeepSeek V3 0324",
     "created": 1742824755,
     "description": "DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team. It succeeds the [DeepSeek V3](/deepseek/deepseek-chat-v3) model and performs really well...",
-    "context_length": 163840,
+    "context_length": 131072,
     "architecture": {
       "modality": "text->text",
       "input_modalities": ["text"],
@@ -2774,7 +2747,7 @@
       "input_cache_read": "0.000000135"
     },
     "top_provider": {
-      "context_length": 163840,
+      "context_length": 32768,
       "max_completion_tokens": 16384,
       "is_moderated": false
     },
@@ -3016,7 +2989,7 @@
     "default_parameters": {},
     "supported_voices": null,
     "knowledge_cutoff": "2024-07-31",
-    "expiration_date": null,
+    "expiration_date": "2026-06-11",
     "links": {
       "details": "/api/v1/models/deepseek/deepseek-r1-distill-llama-70b/endpoints"
     }
@@ -4324,8 +4297,8 @@
       "instruct_type": "gemma"
     },
     "pricing": {
-      "prompt": "0.00000004",
-      "completion": "0.00000013"
+      "prompt": "0.00000005",
+      "completion": "0.00000015"
     },
     "top_provider": {
       "context_length": 131072,
@@ -4428,8 +4401,8 @@
       "instruct_type": "gemma"
     },
     "pricing": {
-      "prompt": "0.00000004",
-      "completion": "0.00000008"
+      "prompt": "0.00000005",
+      "completion": "0.0000001"
     },
     "top_provider": {
       "context_length": 131072,
@@ -4628,11 +4601,12 @@
     },
     "pricing": {
       "prompt": "0.00000012",
-      "completion": "0.00000037"
+      "completion": "0.00000036",
+      "input_cache_read": "0.00000009"
     },
     "top_provider": {
-      "context_length": 262144,
-      "max_completion_tokens": 16384,
+      "context_length": 256000,
+      "max_completion_tokens": 8192,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -5564,7 +5538,7 @@
     "default_parameters": {},
     "supported_voices": null,
     "knowledge_cutoff": "2023-12-31",
-    "expiration_date": null,
+    "expiration_date": "2026-06-19",
     "links": {
       "details": "/api/v1/models/meta-llama/llama-3-70b-instruct/endpoints"
     }
@@ -5585,12 +5559,12 @@
       "instruct_type": "llama3"
     },
     "pricing": {
-      "prompt": "0.00000004",
-      "completion": "0.00000004"
+      "prompt": "0.00000014",
+      "completion": "0.00000014"
     },
     "top_provider": {
       "context_length": 8192,
-      "max_completion_tokens": 8192,
+      "max_completion_tokens": null,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -5601,8 +5575,6 @@
       "min_p",
       "presence_penalty",
       "repetition_penalty",
-      "response_format",
-      "seed",
       "stop",
       "temperature",
       "top_k",
@@ -5683,10 +5655,10 @@
     },
     "pricing": {
       "prompt": "0.00000002",
-      "completion": "0.00000005"
+      "completion": "0.00000003"
     },
     "top_provider": {
-      "context_length": 16384,
+      "context_length": 131072,
       "max_completion_tokens": 16384,
       "is_moderated": false
     },
@@ -5732,8 +5704,8 @@
       "instruct_type": "llama3"
     },
     "pricing": {
-      "prompt": "0.000000245",
-      "completion": "0.000000245"
+      "prompt": "0.000000345",
+      "completion": "0.000000345"
     },
     "top_provider": {
       "context_length": 131072,
@@ -6057,7 +6029,7 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.00000008",
+      "prompt": "0.0000001",
       "completion": "0.0000003"
     },
     "top_provider": {
@@ -6586,7 +6558,8 @@
     },
     "pricing": {
       "prompt": "0.00000015",
-      "completion": "0.00000115"
+      "completion": "0.0000009",
+      "input_cache_read": "0.00000005"
     },
     "top_provider": {
       "context_length": 196608,
@@ -6648,11 +6621,12 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.000000279",
-      "completion": "0.0000012"
+      "prompt": "0.00000027",
+      "completion": "0.00000108",
+      "input_cache_read": "0.000000054"
     },
     "top_provider": {
-      "context_length": 196608,
+      "context_length": 204800,
       "max_completion_tokens": 131072,
       "is_moderated": false
     },
@@ -7887,13 +7861,12 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.0000004",
-      "completion": "0.0000019",
-      "input_cache_read": "0.00000009"
+      "prompt": "0.00000035",
+      "completion": "0.00000189"
     },
     "top_provider": {
-      "context_length": 262144,
-      "max_completion_tokens": 262144,
+      "context_length": 256000,
+      "max_completion_tokens": null,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -7949,13 +7922,13 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.000000684",
-      "completion": "0.00000342",
-      "input_cache_read": "0.000000144"
+      "prompt": "0.00000068",
+      "completion": "0.00000341",
+      "input_cache_read": "0.00000034"
     },
     "top_provider": {
-      "context_length": 262144,
-      "max_completion_tokens": 262144,
+      "context_length": 262142,
+      "max_completion_tokens": 262142,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -7997,52 +7970,6 @@
       "details": "/api/v1/models/moonshotai/kimi-k2.6-20260420/endpoints"
     }
   },
-  {
-    "id": "moonshotai/kimi-k2.6:free",
-    "canonical_slug": "moonshotai/kimi-k2.6-20260420",
-    "hugging_face_id": "moonshotai/Kimi-K2.6",
-    "name": "MoonshotAI: Kimi K2.6 (free)",
-    "created": 1776699402,
-    "description": "Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration. It handles complex end-to-end coding tasks across Python, Rust, and Go, and...",
-    "context_length": 262144,
-    "architecture": {
-      "modality": "text+image->text",
-      "input_modalities": ["text", "image"],
-      "output_modalities": ["text"],
-      "tokenizer": "Other",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0",
-      "completion": "0"
-    },
-    "top_provider": {
-      "context_length": 262144,
-      "max_completion_tokens": null,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "include_reasoning",
-      "reasoning",
-      "tool_choice",
-      "tools"
-    ],
-    "default_parameters": {
-      "temperature": null,
-      "top_p": null,
-      "top_k": null,
-      "frequency_penalty": null,
-      "presence_penalty": null,
-      "repetition_penalty": null
-    },
-    "supported_voices": null,
-    "knowledge_cutoff": null,
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/moonshotai/kimi-k2.6-20260420/endpoints"
-    }
-  },
   {
     "id": "morph/morph-v3-fast",
     "canonical_slug": "morph/morph-v3-fast",
@@ -8120,33 +8047,36 @@
     }
   },
   {
-    "id": "nex-agi/deepseek-v3.1-nex-n1",
-    "canonical_slug": "nex-agi/deepseek-v3.1-nex-n1",
-    "hugging_face_id": "nex-agi/DeepSeek-V3.1-Nex-N1",
-    "name": "Nex AGI: DeepSeek V3.1 Nex N1",
-    "created": 1765204393,
-    "description": "DeepSeek V3.1 Nex-N1 is the flagship release of the Nex-N1 series — a post-trained model designed to highlight agent autonomy, tool use, and real-world productivity. Nex-N1 demonstrates competitive performance across...",
-    "context_length": 131072,
+    "id": "nex-agi/nex-n2-pro:free",
+    "canonical_slug": "nex-agi/nex-n2-pro",
+    "hugging_face_id": "nex-agi/Nex-N2-Pro",
+    "name": "Nex AGI: Nex-N2-Pro (free)",
+    "created": 1780937140,
+    "description": "Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total. Built on the Qwen3.5 architecture, it accepts text and image input and produces...",
+    "context_length": 262144,
     "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
+      "modality": "text+image->text",
+      "input_modalities": ["text", "image"],
       "output_modalities": ["text"],
-      "tokenizer": "DeepSeek",
+      "tokenizer": "Qwen3",
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.000000135",
-      "completion": "0.0000005"
+      "prompt": "0",
+      "completion": "0"
     },
     "top_provider": {
-      "context_length": 131072,
-      "max_completion_tokens": 163840,
+      "context_length": 262144,
+      "max_completion_tokens": 262144,
       "is_moderated": false
     },
     "per_request_limits": null,
     "supported_parameters": [
       "frequency_penalty",
+      "include_reasoning",
+      "logprobs",
       "max_tokens",
+      "reasoning",
       "response_format",
       "structured_outputs",
       "temperature",
@@ -8156,61 +8086,18 @@
       "top_p"
     ],
     "default_parameters": {
-      "temperature": null,
-      "top_p": null,
-      "frequency_penalty": null
+      "temperature": 0.7,
+      "top_p": 0.95,
+      "top_k": 40,
+      "frequency_penalty": null,
+      "presence_penalty": null,
+      "repetition_penalty": null
     },
     "supported_voices": null,
     "knowledge_cutoff": null,
-    "expiration_date": "2026-06-08",
-    "links": {
-      "details": "/api/v1/models/nex-agi/deepseek-v3.1-nex-n1/endpoints"
-    }
-  },
-  {
-    "id": "nousresearch/hermes-2-pro-llama-3-8b",
-    "canonical_slug": "nousresearch/hermes-2-pro-llama-3-8b",
-    "hugging_face_id": "NousResearch/Hermes-2-Pro-Llama-3-8B",
-    "name": "NousResearch: Hermes 2 Pro - Llama-3 8B",
-    "created": 1716768000,
-    "description": "Hermes 2 Pro is an upgraded, retrained version of Nous Hermes 2, consisting of an updated and cleaned version of the OpenHermes 2.5 Dataset, as well as a newly introduced...",
-    "context_length": 8192,
-    "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
-      "output_modalities": ["text"],
-      "tokenizer": "Llama3",
-      "instruct_type": "chatml"
-    },
-    "pricing": {
-      "prompt": "0.00000014",
-      "completion": "0.00000014"
-    },
-    "top_provider": {
-      "context_length": 8192,
-      "max_completion_tokens": 8192,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "frequency_penalty",
-      "max_tokens",
-      "presence_penalty",
-      "repetition_penalty",
-      "response_format",
-      "seed",
-      "stop",
-      "structured_outputs",
-      "temperature",
-      "top_k",
-      "top_p"
-    ],
-    "default_parameters": {},
-    "supported_voices": null,
-    "knowledge_cutoff": "2023-12-31",
-    "expiration_date": "2026-06-05",
+    "expiration_date": null,
     "links": {
-      "details": "/api/v1/models/nousresearch/hermes-2-pro-llama-3-8b/endpoints"
+      "details": "/api/v1/models/nex-agi/nex-n2-pro/endpoints"
     }
   },
   {
@@ -8319,8 +8206,8 @@
       "instruct_type": "chatml"
     },
     "pricing": {
-      "prompt": "0.0000003",
-      "completion": "0.0000003"
+      "prompt": "0.0000007",
+      "completion": "0.0000007"
     },
     "top_provider": {
       "context_length": 131072,
@@ -8457,7 +8344,7 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.0000001",
+      "prompt": "0.0000004",
       "completion": "0.0000004"
     },
     "top_provider": {
@@ -8689,6 +8576,7 @@
       "response_format",
       "seed",
       "stop",
+      "structured_outputs",
       "temperature",
       "tool_choice",
       "tools",
@@ -8763,6 +8651,164 @@
       "details": "/api/v1/models/nvidia/nemotron-3-super-120b-a12b-20230311/endpoints"
     }
   },
+  {
+    "id": "nvidia/nemotron-3-ultra-550b-a55b",
+    "canonical_slug": "nvidia/nemotron-3-ultra-550b-a55b-20260604",
+    "hugging_face_id": "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16",
+    "name": "NVIDIA: Nemotron 3 Ultra",
+    "created": 1780551208,
+    "description": "NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE). Built on a hybrid Transformer-Mamba mixture-of-experts architecture, it...",
+    "context_length": 1000000,
+    "architecture": {
+      "modality": "text->text",
+      "input_modalities": ["text"],
+      "output_modalities": ["text"],
+      "tokenizer": "Other",
+      "instruct_type": null
+    },
+    "pricing": {
+      "prompt": "0.0000005",
+      "completion": "0.0000025",
+      "input_cache_read": "0.00000015"
+    },
+    "top_provider": {
+      "context_length": 262144,
+      "max_completion_tokens": 16384,
+      "is_moderated": false
+    },
+    "per_request_limits": null,
+    "supported_parameters": [
+      "frequency_penalty",
+      "include_reasoning",
+      "logit_bias",
+      "max_tokens",
+      "min_p",
+      "presence_penalty",
+      "reasoning",
+      "repetition_penalty",
+      "response_format",
+      "seed",
+      "stop",
+      "structured_outputs",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_k",
+      "top_p"
+    ],
+    "default_parameters": {
+      "temperature": 1,
+      "top_p": 0.95,
+      "top_k": null,
+      "frequency_penalty": null,
+      "presence_penalty": null,
+      "repetition_penalty": null
+    },
+    "supported_voices": null,
+    "knowledge_cutoff": null,
+    "expiration_date": null,
+    "links": {
+      "details": "/api/v1/models/nvidia/nemotron-3-ultra-550b-a55b-20260604/endpoints"
+    }
+  },
+  {
+    "id": "nvidia/nemotron-3-ultra-550b-a55b:free",
+    "canonical_slug": "nvidia/nemotron-3-ultra-550b-a55b-20260604",
+    "hugging_face_id": "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16",
+    "name": "NVIDIA: Nemotron 3 Ultra (free)",
+    "created": 1780551208,
+    "description": "NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE). Built on a hybrid Transformer-Mamba mixture-of-experts architecture, it...",
+    "context_length": 1000000,
+    "architecture": {
+      "modality": "text->text",
+      "input_modalities": ["text"],
+      "output_modalities": ["text"],
+      "tokenizer": "Other",
+      "instruct_type": null
+    },
+    "pricing": {
+      "prompt": "0",
+      "completion": "0"
+    },
+    "top_provider": {
+      "context_length": 1000000,
+      "max_completion_tokens": 65536,
+      "is_moderated": false
+    },
+    "per_request_limits": null,
+    "supported_parameters": [
+      "include_reasoning",
+      "max_tokens",
+      "reasoning",
+      "seed",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_p"
+    ],
+    "default_parameters": {
+      "temperature": 1,
+      "top_p": 0.95,
+      "top_k": null,
+      "frequency_penalty": null,
+      "presence_penalty": null,
+      "repetition_penalty": null
+    },
+    "supported_voices": null,
+    "knowledge_cutoff": null,
+    "expiration_date": null,
+    "links": {
+      "details": "/api/v1/models/nvidia/nemotron-3-ultra-550b-a55b-20260604/endpoints"
+    }
+  },
+  {
+    "id": "nvidia/nemotron-3.5-content-safety:free",
+    "canonical_slug": "nvidia/nemotron-3.5-content-safety-20260604",
+    "hugging_face_id": "nvidia/Nemotron-3.5-Content-Safety",
+    "name": "NVIDIA: Nemotron 3.5 Content Safety (free)",
+    "created": 1780581864,
+    "description": "NVIDIA Nemotron 3.5 Content Safety is a compact 4B-parameter multimodal guardrail model from NVIDIA, fine-tuned from Google Gemma-3-4B. It moderates both inputs to and responses from LLMs and VLMs, accepting...",
+    "context_length": 128000,
+    "architecture": {
+      "modality": "text+image->text",
+      "input_modalities": ["text", "image"],
+      "output_modalities": ["text"],
+      "tokenizer": "Other",
+      "instruct_type": null
+    },
+    "pricing": {
+      "prompt": "0",
+      "completion": "0"
+    },
+    "top_provider": {
+      "context_length": 128000,
+      "max_completion_tokens": 8192,
+      "is_moderated": false
+    },
+    "per_request_limits": null,
+    "supported_parameters": [
+      "include_reasoning",
+      "max_tokens",
+      "reasoning",
+      "seed",
+      "temperature",
+      "top_p"
+    ],
+    "default_parameters": {
+      "temperature": null,
+      "top_p": null,
+      "top_k": null,
+      "frequency_penalty": null,
+      "presence_penalty": null,
+      "repetition_penalty": null
+    },
+    "supported_voices": null,
+    "knowledge_cutoff": null,
+    "expiration_date": null,
+    "links": {
+      "details": "/api/v1/models/nvidia/nemotron-3.5-content-safety-20260604/endpoints"
+    }
+  },
   {
     "id": "nvidia/nemotron-nano-12b-v2-vl:free",
     "canonical_slug": "nvidia/nemotron-nano-12b-v2-vl",
@@ -8860,7 +8906,7 @@
     },
     "supported_voices": null,
     "knowledge_cutoff": "2025-03-31",
-    "expiration_date": null,
+    "expiration_date": "2026-06-11",
     "links": {
       "details": "/api/v1/models/nvidia/nemotron-nano-9b-v2/endpoints"
     }
@@ -9106,116 +9152,17 @@
     "knowledge_cutoff": "2021-09-30",
     "expiration_date": null,
     "links": {
-      "details": "/api/v1/models/openai/gpt-3.5-turbo-instruct/endpoints"
-    }
-  },
-  {
-    "id": "openai/gpt-4",
-    "canonical_slug": "openai/gpt-4",
-    "hugging_face_id": null,
-    "name": "OpenAI: GPT-4",
-    "created": 1685232000,
-    "description": "OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and advanced reasoning...",
-    "context_length": 8191,
-    "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
-      "output_modalities": ["text"],
-      "tokenizer": "GPT",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0.00003",
-      "completion": "0.00006"
-    },
-    "top_provider": {
-      "context_length": 8191,
-      "max_completion_tokens": 4096,
-      "is_moderated": true
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "frequency_penalty",
-      "logit_bias",
-      "logprobs",
-      "max_completion_tokens",
-      "max_tokens",
-      "presence_penalty",
-      "response_format",
-      "seed",
-      "stop",
-      "structured_outputs",
-      "temperature",
-      "tool_choice",
-      "tools",
-      "top_logprobs",
-      "top_p"
-    ],
-    "default_parameters": {},
-    "supported_voices": null,
-    "knowledge_cutoff": "2021-09-30",
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/openai/gpt-4/endpoints"
-    }
-  },
-  {
-    "id": "openai/gpt-4-0314",
-    "canonical_slug": "openai/gpt-4-0314",
-    "hugging_face_id": null,
-    "name": "OpenAI: GPT-4 (older v0314)",
-    "created": 1685232000,
-    "description": "GPT-4-0314 is the first version of GPT-4 released, with a context length of 8,192 tokens, and was supported until June 14. Training data: up to Sep 2021.",
-    "context_length": 8191,
-    "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
-      "output_modalities": ["text"],
-      "tokenizer": "GPT",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0.00003",
-      "completion": "0.00006"
-    },
-    "top_provider": {
-      "context_length": 8191,
-      "max_completion_tokens": 4096,
-      "is_moderated": true
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "frequency_penalty",
-      "logit_bias",
-      "logprobs",
-      "max_tokens",
-      "presence_penalty",
-      "response_format",
-      "seed",
-      "stop",
-      "structured_outputs",
-      "temperature",
-      "tool_choice",
-      "tools",
-      "top_logprobs",
-      "top_p"
-    ],
-    "default_parameters": {},
-    "supported_voices": null,
-    "knowledge_cutoff": "2021-09-30",
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/openai/gpt-4-0314/endpoints"
+      "details": "/api/v1/models/openai/gpt-3.5-turbo-instruct/endpoints"
     }
   },
   {
-    "id": "openai/gpt-4-1106-preview",
-    "canonical_slug": "openai/gpt-4-1106-preview",
+    "id": "openai/gpt-4",
+    "canonical_slug": "openai/gpt-4",
     "hugging_face_id": null,
-    "name": "OpenAI: GPT-4 Turbo (older v1106)",
-    "created": 1699228800,
-    "description": "The latest GPT-4 Turbo model with vision capabilities. Vision requests can now use JSON mode and function calling.\n\nTraining data: up to April 2023.",
-    "context_length": 128000,
+    "name": "OpenAI: GPT-4",
+    "created": 1685232000,
+    "description": "OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and advanced reasoning...",
+    "context_length": 8191,
     "architecture": {
       "modality": "text->text",
       "input_modalities": ["text"],
@@ -9224,12 +9171,11 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.00001",
-      "completion": "0.00003",
-      "web_search": "0.01"
+      "prompt": "0.00003",
+      "completion": "0.00006"
     },
     "top_provider": {
-      "context_length": 128000,
+      "context_length": 8191,
       "max_completion_tokens": 4096,
       "is_moderated": true
     },
@@ -9238,6 +9184,7 @@
       "frequency_penalty",
       "logit_bias",
       "logprobs",
+      "max_completion_tokens",
       "max_tokens",
       "presence_penalty",
       "response_format",
@@ -9252,10 +9199,10 @@
     ],
     "default_parameters": {},
     "supported_voices": null,
-    "knowledge_cutoff": "2023-04-30",
+    "knowledge_cutoff": "2021-09-30",
     "expiration_date": null,
     "links": {
-      "details": "/api/v1/models/openai/gpt-4-1106-preview/endpoints"
+      "details": "/api/v1/models/openai/gpt-4/endpoints"
     }
   },
   {
@@ -13072,7 +13019,7 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.000000071",
+      "prompt": "0.00000009",
       "completion": "0.0000001"
     },
     "top_provider": {
@@ -13179,12 +13126,12 @@
       "instruct_type": "qwen3"
     },
     "pricing": {
-      "prompt": "0.00000009",
-      "completion": "0.00000045"
+      "prompt": "0.00000012",
+      "completion": "0.0000005"
     },
     "top_provider": {
       "context_length": 40960,
-      "max_completion_tokens": 20000,
+      "max_completion_tokens": 16384,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -13216,7 +13163,7 @@
     },
     "supported_voices": null,
     "knowledge_cutoff": "2025-03-31",
-    "expiration_date": "2026-06-05",
+    "expiration_date": null,
     "links": {
       "details": "/api/v1/models/qwen/qwen3-30b-a3b-04-28/endpoints"
     }
@@ -13237,8 +13184,8 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.0000000428",
-      "completion": "0.0000001716"
+      "prompt": "0.00000004815",
+      "completion": "0.00000019305"
     },
     "top_provider": {
       "context_length": 128000,
@@ -14622,12 +14569,12 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.00000004",
+      "prompt": "0.0000001",
       "completion": "0.00000015"
     },
     "top_provider": {
       "context_length": 262144,
-      "max_completion_tokens": 81920,
+      "max_completion_tokens": 262144,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -14830,12 +14777,12 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.00000029",
-      "completion": "0.0000032"
+      "prompt": "0.000000289",
+      "completion": "0.0000024"
     },
     "top_provider": {
-      "context_length": 262140,
-      "max_completion_tokens": 262140,
+      "context_length": 131072,
+      "max_completion_tokens": 131072,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -14891,12 +14838,13 @@
       "instruct_type": null
     },
     "pricing": {
-      "prompt": "0.00000014",
-      "completion": "0.000001"
+      "prompt": "0.00000015",
+      "completion": "0.000001",
+      "input_cache_read": "0.00000005"
     },
     "top_provider": {
-      "context_length": 262140,
-      "max_completion_tokens": 262140,
+      "context_length": 262144,
+      "max_completion_tokens": 262144,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -15140,6 +15088,56 @@
       "details": "/api/v1/models/qwen/qwen3.7-max-20260520/endpoints"
     }
   },
+  {
+    "id": "qwen/qwen3.7-plus",
+    "canonical_slug": "qwen/qwen3.7-plus-20260602",
+    "hugging_face_id": null,
+    "name": "Qwen: Qwen3.7 Plus",
+    "created": 1780491783,
+    "description": "Qwen3.7-Plus is a cost-effective model in Alibaba's Qwen3.7 series. It supports text and image input with text output, building on the series' text capabilities with a comprehensive upgrade to its...",
+    "context_length": 1000000,
+    "architecture": {
+      "modality": "text+image->text",
+      "input_modalities": ["text", "image"],
+      "output_modalities": ["text"],
+      "tokenizer": "Qwen",
+      "instruct_type": null
+    },
+    "pricing": {
+      "prompt": "0.0000004",
+      "completion": "0.0000016",
+      "input_cache_read": "0.00000008",
+      "input_cache_write": "0.0000005"
+    },
+    "top_provider": {
+      "context_length": 1000000,
+      "max_completion_tokens": 65536,
+      "is_moderated": false
+    },
+    "per_request_limits": null,
+    "supported_parameters": [
+      "include_reasoning",
+      "logprobs",
+      "max_tokens",
+      "presence_penalty",
+      "reasoning",
+      "response_format",
+      "seed",
+      "structured_outputs",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_logprobs",
+      "top_p"
+    ],
+    "default_parameters": {},
+    "supported_voices": null,
+    "knowledge_cutoff": null,
+    "expiration_date": null,
+    "links": {
+      "details": "/api/v1/models/qwen/qwen3.7-plus-20260602/endpoints"
+    }
+  },
   {
     "id": "rekaai/reka-edge",
     "canonical_slug": "rekaai/reka-edge-2603",
@@ -15329,52 +15327,6 @@
       "details": "/api/v1/models/relace/relace-search-20251208/endpoints"
     }
   },
-  {
-    "id": "sao10k/l3-euryale-70b",
-    "canonical_slug": "sao10k/l3-euryale-70b",
-    "hugging_face_id": "Sao10K/L3-70B-Euryale-v2.1",
-    "name": "Sao10k: Llama 3 Euryale 70B v2.1",
-    "created": 1718668800,
-    "description": "Euryale 70B v2.1 is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k). - Better prompt adherence. - Better anatomy / spatial awareness. - Adapts much better to unique and custom...",
-    "context_length": 8192,
-    "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
-      "output_modalities": ["text"],
-      "tokenizer": "Llama3",
-      "instruct_type": "llama3"
-    },
-    "pricing": {
-      "prompt": "0.00000148",
-      "completion": "0.00000148"
-    },
-    "top_provider": {
-      "context_length": 8192,
-      "max_completion_tokens": 8192,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "frequency_penalty",
-      "max_tokens",
-      "presence_penalty",
-      "repetition_penalty",
-      "seed",
-      "stop",
-      "temperature",
-      "tool_choice",
-      "tools",
-      "top_k",
-      "top_p"
-    ],
-    "default_parameters": {},
-    "supported_voices": null,
-    "knowledge_cutoff": "2023-12-31",
-    "expiration_date": "2026-06-05",
-    "links": {
-      "details": "/api/v1/models/sao10k/l3-euryale-70b/endpoints"
-    }
-  },
   {
     "id": "sao10k/l3-lunaris-8b",
     "canonical_slug": "sao10k/l3-lunaris-8b",
@@ -16425,14 +16377,11 @@
       "max_tokens",
       "presence_penalty",
       "reasoning",
-      "repetition_penalty",
       "response_format",
-      "seed",
       "stop",
       "temperature",
       "tool_choice",
       "tools",
-      "top_k",
       "top_p"
     ],
     "default_parameters": {
@@ -16561,50 +16510,6 @@
       "details": "/api/v1/models/xiaomi/mimo-v2.5-pro-20260422/endpoints"
     }
   },
-  {
-    "id": "z-ai/glm-4-32b",
-    "canonical_slug": "z-ai/glm-4-32b-0414",
-    "hugging_face_id": "",
-    "name": "Z.ai: GLM 4 32B ",
-    "created": 1753376617,
-    "description": "GLM 4 32B is a cost-effective foundation language model. It can efficiently perform complex tasks and has significantly enhanced capabilities in tool use, online search, and code-related intelligent tasks. It...",
-    "context_length": 128000,
-    "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
-      "output_modalities": ["text"],
-      "tokenizer": "Other",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0.0000001",
-      "completion": "0.0000001"
-    },
-    "top_provider": {
-      "context_length": 128000,
-      "max_completion_tokens": null,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "max_tokens",
-      "temperature",
-      "tool_choice",
-      "tools",
-      "top_p"
-    ],
-    "default_parameters": {
-      "temperature": 0.75,
-      "top_p": null,
-      "frequency_penalty": null
-    },
-    "supported_voices": null,
-    "knowledge_cutoff": "2024-06-30",
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/z-ai/glm-4-32b-0414/endpoints"
-    }
-  },
   {
     "id": "z-ai/glm-4.5",
     "canonical_slug": "z-ai/glm-4.5",
@@ -16654,7 +16559,7 @@
     },
     "supported_voices": null,
     "knowledge_cutoff": "2024-12-31",
-    "expiration_date": null,
+    "expiration_date": "2026-06-19",
     "links": {
       "details": "/api/v1/models/z-ai/glm-4.5/endpoints"
     }
@@ -16688,6 +16593,7 @@
     "supported_parameters": [
       "frequency_penalty",
       "include_reasoning",
+      "logprobs",
       "max_tokens",
       "presence_penalty",
       "reasoning",
@@ -16699,52 +16605,7 @@
       "tool_choice",
       "tools",
       "top_k",
-      "top_p"
-    ],
-    "default_parameters": {
-      "temperature": 0.75,
-      "top_p": null,
-      "frequency_penalty": null
-    },
-    "supported_voices": null,
-    "knowledge_cutoff": "2024-12-31",
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/z-ai/glm-4.5-air/endpoints"
-    }
-  },
-  {
-    "id": "z-ai/glm-4.5-air:free",
-    "canonical_slug": "z-ai/glm-4.5-air",
-    "hugging_face_id": "zai-org/GLM-4.5-Air",
-    "name": "Z.ai: GLM 4.5 Air (free)",
-    "created": 1753471258,
-    "description": "GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications. Like GLM-4.5, it adopts the Mixture-of-Experts (MoE) architecture but with a more compact parameter...",
-    "context_length": 131072,
-    "architecture": {
-      "modality": "text->text",
-      "input_modalities": ["text"],
-      "output_modalities": ["text"],
-      "tokenizer": "Other",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0",
-      "completion": "0"
-    },
-    "top_provider": {
-      "context_length": 131072,
-      "max_completion_tokens": 96000,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "include_reasoning",
-      "max_tokens",
-      "reasoning",
-      "temperature",
-      "tool_choice",
-      "tools",
+      "top_logprobs",
       "top_p"
     ],
     "default_parameters": {
@@ -16891,11 +16752,11 @@
     "pricing": {
       "prompt": "0.0000003",
       "completion": "0.0000009",
-      "input_cache_read": "0.00000005"
+      "input_cache_read": "0.000000055"
     },
     "top_provider": {
       "context_length": 131072,
-      "max_completion_tokens": 24000,
+      "max_completion_tokens": 32768,
       "is_moderated": false
     },
     "per_request_limits": null,
@@ -17107,7 +16968,7 @@
     "name": "Z.ai: GLM 5 Turbo",
     "created": 1773583573,
     "description": "GLM-5 Turbo is a new model from Z.ai designed for fast inference and strong performance in agent-driven environments such as OpenClaw scenarios. It is deeply optimized for real-world agent workflows...",
-    "context_length": 202752,
+    "context_length": 262144,
     "architecture": {
       "modality": "text->text",
       "input_modalities": ["text"],
@@ -17121,7 +16982,7 @@
       "input_cache_read": "0.00000024"
     },
     "top_provider": {
-      "context_length": 202752,
+      "context_length": 262144,
       "max_completion_tokens": 131072,
       "is_moderated": false
     },
@@ -17222,56 +17083,5 @@
     "links": {
       "details": "/api/v1/models/z-ai/glm-5.1-20260406/endpoints"
     }
-  },
-  {
-    "id": "z-ai/glm-5v-turbo",
-    "canonical_slug": "z-ai/glm-5v-turbo-20260401",
-    "hugging_face_id": "",
-    "name": "Z.ai: GLM 5V Turbo",
-    "created": 1775061458,
-    "description": "GLM-5V-Turbo is Z.ai’s first native multimodal agent foundation model, built for vision-based coding and agent-driven tasks. It natively handles image, video, and text inputs, excels at long-horizon planning, complex coding,...",
-    "context_length": 202752,
-    "architecture": {
-      "modality": "text+image+video->text",
-      "input_modalities": ["image", "text", "video"],
-      "output_modalities": ["text"],
-      "tokenizer": "Other",
-      "instruct_type": null
-    },
-    "pricing": {
-      "prompt": "0.0000012",
-      "completion": "0.000004",
-      "input_cache_read": "0.00000024"
-    },
-    "top_provider": {
-      "context_length": 202752,
-      "max_completion_tokens": 131072,
-      "is_moderated": false
-    },
-    "per_request_limits": null,
-    "supported_parameters": [
-      "include_reasoning",
-      "max_tokens",
-      "reasoning",
-      "response_format",
-      "temperature",
-      "tool_choice",
-      "tools",
-      "top_p"
-    ],
-    "default_parameters": {
-      "temperature": 1,
-      "top_p": 0.95,
-      "top_k": null,
-      "frequency_penalty": null,
-      "presence_penalty": null,
-      "repetition_penalty": null
-    },
-    "supported_voices": null,
-    "knowledge_cutoff": null,
-    "expiration_date": null,
-    "links": {
-      "details": "/api/v1/models/z-ai/glm-5v-turbo-20260401/endpoints"
-    }
   }
 ]