LLMs: Grok 4.3 support

2026-05-10 21:50:14 -07:00 · 2026-05-03 14:22:16 -07:00
parent d5d7cf5a21
commit d3a7b75d1c
1 changed file with 27 additions and 4 deletions
@@ -16,7 +16,14 @@ const DEV_DEBUG_XAI_MODELS = (Release.TenantSlug as any) === 'staging' /* ALSO I

 // Known xAI Models - Manual Mappings
 // List on: https://docs.x.ai/docs/models?cluster=us-east-1
-// Verified: 2026-04-16
+// Verified: 2026-05-03
+
+// Flat pricing for the Grok 4.3 flagship (April 2026); referenced as `chatPrice` by the 'grok-4.3' mapping below
+const PRICE_43 = {
+  input: 1.25, // NOTE(review): presumably USD per 1M input tokens - confirm against the xAI pricing page
+  output: 2.5, // NOTE(review): presumably USD per 1M output tokens - confirm
+  cache: { cType: 'oai-ac' as const, read: 0.2 }, // only a `read` rate is declared for cached input; NOTE(review): same unit as above - confirm
+};

 // Flat pricing for Grok 4.20 flagship models
 const PRICE_420 = {
@@ -82,11 +89,25 @@ const XAI_PAR_Pre4: ModelDescriptionSchema['parameterSpecs'] = [] as const;

 const _knownXAIChatModels: ManualMappings = [

-  // Grok 4.20 (flagship, March 2026) - note: model IDs use dot (4.20), unlike earlier models
+  // Grok 4.3 (flagship, April 2026) - always-on reasoning, no reasoning_effort support
  {
+    idPrefix: 'grok-4.3',
+    label: 'Grok 4.3',
+    description: 'xAI\'s latest flagship model with always-on reasoning and a 1M token context window. Supports text, image, and video inputs with improved agentic performance at lower cost.',
+    contextWindow: 1000000,
+    maxCompletionTokens: undefined,
+    interfaces: [...XAI_IF_Vision, LLM_IF_OAI_Reasoning],
+    parameterSpecs: XAI_PAR, // no reasoning_effort - always-on reasoning
+    chatPrice: PRICE_43,
+    benchmark: { cbaElo: 1456 }, // grok-4.3
+  },
+
+  // Grok 4.20 (flagship, March 2026) - superseded by 4.3
+  {
+    hidden: true, // yield to 4.3
    idPrefix: 'grok-4.20-0309-reasoning',
    label: 'Grok 4.20 Reasoning',
-    description: 'xAI\'s most advanced flagship reasoning model with a 2M token context window. Deep reasoning and problem-solving capabilities with text and image inputs.',
+    description: 'xAI\'s previous flagship reasoning model with a 2M token context window. Deep reasoning and problem-solving capabilities with text and image inputs.',
    contextWindow: 2000000,
    maxCompletionTokens: undefined,
    interfaces: [...XAI_IF_Vision, LLM_IF_OAI_Reasoning],
@@ -95,9 +116,10 @@ const _knownXAIChatModels: ManualMappings = [
    benchmark: { cbaElo: 1480 }, // grok-4.20-beta-0309-reasoning (CBA name)
  },
  {
+    hidden: true, // yield to 4.3
    idPrefix: 'grok-4.20-0309-non-reasoning',
    label: 'Grok 4.20',
-    description: 'xAI\'s most advanced flagship model with a 2M token context window. Non-reasoning variant for fast, high-quality responses with text and image inputs.',
+    description: 'xAI\'s previous flagship model with a 2M token context window. Non-reasoning variant for fast, high-quality responses with text and image inputs.',
    contextWindow: 2000000,
    maxCompletionTokens: undefined,
    interfaces: XAI_IF_Vision,
@@ -320,6 +342,7 @@ export async function xaiFetchModelDescriptions(access: OpenAIAccessSchema): Pro

 // manual sort order - your desired order
 const _xaiIdStartsWithOrder = [
+  'grok-4.3',
  'grok-4.20-0309-reasoning',
  'grok-4.20-0309-non-reasoning',
  'grok-4.20-multi-agent-0309',