OpenAI: update models

2026-05-10 21:50:14 -07:00 · 2025-06-11 14:11:14 -07:00
parent 702006f6ea
commit 13e0779ced
1 changed files with 93 additions and 14 deletions
@@ -43,6 +43,18 @@ export const _knownOpenAIChatModels: ManualMappings = [
    chatPrice: { input: 3, output: 12 },
    isPreview: true,
  },
+  {
+    hidden: true, // RESPONSES API UNSUPPORTED YET
+    idPrefix: 'codex-mini-latest',
+    label: 'Codex Mini Latest',
+    description: 'Fast reasoning model optimized for the Codex CLI. A fine-tuned version of o4-mini.',
+    contextWindow: 200000,
+    maxCompletionTokens: 100000,
+    trainingDataCutoff: 'May 31, 2024',
+    interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
+    parameterSpecs: [{ paramId: 'llmVndOaiReasoningEffort' }],
+    chatPrice: { input: 1.5, cache: { cType: 'oai-ac', read: 0.375 }, output: 6 },
+  },


  /// Reasoning models - o-series
@@ -77,6 +89,36 @@ export const _knownOpenAIChatModels: ManualMappings = [
    // benchmarks not available yet, as of 2025-04-16 (intro)
  },

+  // o3-pro - (v1/responses API - UNSUPPORTED YET) 💎💰
+  {
+    hidden: true, // UNSUPPORTED /responses API yet
+    idPrefix: 'o3-pro-2025-06-10',
+    label: 'o3 Pro (2025-06-10) [unsupported]',
+    description: 'Requires (unsupported) Responses API. Version of o3 with more compute for better responses. Provides consistently better answers for complex tasks.',
+    contextWindow: 200000,
+    maxCompletionTokens: 100000,
+    trainingDataCutoff: 'May 31, 2024',
+    interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning],
+    parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
+    chatPrice: { input: 20, output: 80 },
+    // benchmark: has not been measured yet
+  },
+  {
+    idPrefix: 'o3-pro',
+    label: 'o3 Pro',
+    description: 'Requires (unsupported) Responses API. Version of o3 with more compute for better responses. Points to o3-pro-2025-06-10.',
+    symLink: 'o3-pro-2025-06-10',
+    hidden: true, // prefer versioned
+    // copied from symlinked
+    contextWindow: 200000,
+    maxCompletionTokens: 100000,
+    trainingDataCutoff: 'May 31, 2024',
+    interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning],
+    parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
+    chatPrice: { input: 20, output: 80 },
+    // benchmark: has not been measured yet
+  },
+
  /// o3
  {
    isLatest: true,
@@ -88,7 +130,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
    trainingDataCutoff: 'May 31, 2024',
    interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
    parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
-    chatPrice: { input: 10, cache: { cType: 'oai-ac', read: 2.5 }, output: 40 },
+    chatPrice: { input: 2, cache: { cType: 'oai-ac', read: 0.5 }, output: 8 },
    // benchmark: { cbaElo: 1413 /* unknown variant, as of 2025-05-12 */ },
  },
  {
@@ -103,7 +145,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
    trainingDataCutoff: 'May 31, 2024',
    interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
    parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
-    chatPrice: { input: 10, cache: { cType: 'oai-ac', read: 2.5 }, output: 40 },
+    chatPrice: { input: 2, cache: { cType: 'oai-ac', read: 0.5 }, output: 8 },
    // benchmarks not available yet, as of 2025-04-16 (intro)
  },

@@ -123,7 +165,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
  {
    idPrefix: 'o3-mini',
    label: 'o3 Mini',
-    description: 'Points to the most recent o3-mini snapshot: o3-mini-2025-01-31',
+    description: 'A small model alternative to o3. Points to the most recent o3-mini snapshot: o3-mini-2025-01-31',
    symLink: 'o3-mini-2025-01-31',
    hidden: true, // prefer versioned
    // copied from symlinked
@@ -170,7 +212,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
  {
    idPrefix: 'o1-2024-12-17',
    label: 'o1 (2024-12-17)',
-    description: 'Latest o1 model.',
+    description: 'Previous full o-series reasoning model.',
    contextWindow: 200000,
    maxCompletionTokens: 100000,
    trainingDataCutoff: 'Oct 2023',
@@ -182,7 +224,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
  {
    idPrefix: 'o1',
    label: 'o1',
-    description: 'Points to the most recent snapshot of the o1 model: o1-2024-12-17',
+    description: 'Previous full o-series reasoning model. Points to the most recent snapshot: o1-2024-12-17',
    symLink: 'o1-2024-12-17',
    hidden: true, // prefer versioned
    // copied from symlinked
@@ -195,7 +237,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
    benchmark: { cbaElo: 1350 },
  },

-  // o1-preview
+  // o1-preview (deprecated)
  {
    hidden: true, // OUTDATED
    idPrefix: 'o1-preview-2024-09-12',
@@ -208,6 +250,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
    chatPrice: { input: 15, cache: { cType: 'oai-ac', read: 7.5 }, output: 60 },
    benchmark: { cbaElo: 1335 },
    isPreview: true,
+    isLegacy: true,
  },
  {
    idPrefix: 'o1-preview',
@@ -223,24 +266,27 @@ export const _knownOpenAIChatModels: ManualMappings = [
    chatPrice: { input: 15, cache: { cType: 'oai-ac', read: 7.5 }, output: 60 },
    benchmark: { cbaElo: 1335 },
    isPreview: true,
+    isLegacy: true,
  },

-  // o1-mini
+  // o1-mini (deprecated)
  {
+    hidden: true, // DEPRECATED
    idPrefix: 'o1-mini-2024-09-12',
    label: 'o1 Mini (2024-09-12)', // ⏱️
-    description: 'Latest o1-mini model snapshot. Fast, cost-efficient reasoning model tailored to coding, math, and science use cases.',
+    description: 'Deprecated. Fast, cost-efficient reasoning model tailored to coding, math, and science use cases.',
    contextWindow: 128000,
    maxCompletionTokens: 65536,
    trainingDataCutoff: 'Oct 2023',
    interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching, LLM_IF_HOTFIX_StripImages, LLM_IF_HOTFIX_Sys0ToUsr0],
    chatPrice: { input: 1.1, cache: { cType: 'oai-ac', read: 0.55 }, output: 4.4 },
    benchmark: { cbaElo: 1304 },
+    isLegacy: true,
  },
  {
    idPrefix: 'o1-mini',
    label: 'o1 Mini',
-    description: 'Points to the most recent o1-mini snapshot: o1-mini-2024-09-12',
+    description: 'Deprecated. A small model alternative to o1. Points to the most recent o1-mini snapshot: o1-mini-2024-09-12',
    symLink: 'o1-mini-2024-09-12',
    hidden: true, // prefer versioned
    // copied from symlinked
@@ -250,6 +296,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
    interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching, LLM_IF_HOTFIX_StripImages, LLM_IF_HOTFIX_Sys0ToUsr0],
    chatPrice: { input: 1.1, cache: { cType: 'oai-ac', read: 0.55 }, output: 4.4 },
    benchmark: { cbaElo: 1304 },
+    isLegacy: true,
  },

  /// GPT-4.1 series
@@ -342,8 +389,8 @@ export const _knownOpenAIChatModels: ManualMappings = [
  {
    hidden: true, // OBSOLETE
    idPrefix: 'gpt-4.5-preview-2025-02-27',
-    label: 'GPT-4.5 Preview (2025-02-27)',
-    description: 'Research preview of GPT-4.5, our largest and most capable GPT model yet. Deep world knowledge and better understanding of user intent makes it good at creative tasks and agentic planning.',
+    label: 'GPT-4.5 Preview (2025-02-27)', //  [deprecated]
+    description: 'Will be shut down on 2025-07-14. Research preview of GPT-4.5, our largest and most capable GPT model yet. Deep world knowledge and better understanding of user intent makes it good at creative tasks and agentic planning.',
    contextWindow: 128000,
    maxCompletionTokens: 16384,
    trainingDataCutoff: 'Oct 2023',
@@ -354,7 +401,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
  },
  {
    idPrefix: 'gpt-4.5-preview',
-    label: 'GPT-4.5 Preview',
+    label: 'GPT-4.5 Preview', //  [deprecated]
    description: 'Largest GPT model, good for creative tasks and agentic planning. Currently points to gpt-4.5-preview-2025-02-27.',
    symLink: 'gpt-4.5-preview-2025-02-27',
    hidden: true, // prefer versioned
@@ -466,6 +513,19 @@ export const _knownOpenAIChatModels: ManualMappings = [
  },

  // GPT-4o Audio Preview
+  {
+    hidden: true, // UNSUPPORTED yet (audio output model)
+    idPrefix: 'gpt-4o-audio-preview-2025-06-03',
+    label: 'GPT-4o Audio Preview (2025-06-03)',
+    description: 'Latest snapshot for the Audio API model.',
+    contextWindow: 128000,
+    maxCompletionTokens: 16384,
+    trainingDataCutoff: 'Oct 2023',
+    interfaces: [LLM_IF_OAI_NeedsAudio],
+    chatPrice: { input: 2.5, output: 10 /* AUDIO PRICING UNSUPPORTED 40/80 */ },
+    // benchmarks don't apply to audio models
+    isPreview: true,
+  },
  {
    hidden: true, // UNSUPPORTED yet (audio output model)
    idPrefix: 'gpt-4o-audio-preview-2024-12-17',
@@ -496,7 +556,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
    idPrefix: 'gpt-4o-audio-preview',
    label: 'GPT-4o Audio Preview',
    description: 'Preview release for audio inputs in chat completions.',
-    symLink: 'gpt-4o-audio-preview-2024-12-17',
+    symLink: 'gpt-4o-audio-preview-2024-12-17', // still points to 12-17 as of 2025-06-11
    hidden: true, // prefer versioned
    // copied from symlinked
    contextWindow: 128000,
@@ -509,6 +569,19 @@ export const _knownOpenAIChatModels: ManualMappings = [
  },

  // GPT-4o Realtime Preview
+  {
+    hidden: true, // UNSUPPORTED yet - REALTIME API
+    idPrefix: 'gpt-4o-realtime-preview-2025-06-03',
+    label: 'GPT-4o Realtime Preview (2025-06-03)',
+    description: 'Latest snapshot for the Realtime API model.',
+    contextWindow: 128000,
+    maxCompletionTokens: 4096,
+    trainingDataCutoff: 'Oct 2023',
+    interfaces: [LLM_IF_OAI_Realtime],
+    chatPrice: { input: 5, cache: { cType: 'oai-ac', read: 2.5 }, output: 20 /* AUDIO PRICING UNSUPPORTED 40/80 */ },
+    // benchmarks don't apply to realtime models
+    isPreview: true,
+  },
  {
    hidden: true, // UNSUPPORTED yet - REALTIME API
    idPrefix: 'gpt-4o-realtime-preview-2024-12-17',
@@ -871,6 +944,8 @@ export const _knownOpenAIChatModels: ManualMappings = [
 const openAIModelsDenyList: string[] = [
  // [OpenAI, 2025-03-11] FIXME: NOT YET SUPPORTED - "RESPONSES API"
  'computer-use-preview', 'computer-use-preview-2025-03-11', // FIXME: support these
+  'codex-mini-latest', // FIXME: support these
+  // 'o3-pro', // FIXME: support these
  'o1-pro', // FIXME: support these

  // Legacy GPT models
@@ -898,7 +973,7 @@ const openAIModelsDenyList: string[] = [
  'gpt-image-1', 'dall-e-3', 'dall-e-2',

  // Moderation models
-  'omni-moderation-latest', 'omni-moderation-2024-09-26',
+  'omni-moderation-latest', 'omni-moderation-2024-09-26', 'text-moderation-latest',
 ];

 export function openAIModelFilter(model: OpenAIWire_API_Models_List.Model) {
@@ -921,6 +996,8 @@ const _manualOrderingIdPrefixes = [
  'o4-20',
  'o4-mini-20',
  'o4-',
+  'o3-pro-20',
+  'o3-pro',
  'o3-20',
  'o3-mini-20',
  'o3-',
@@ -952,6 +1029,8 @@ const _manualOrderingIdPrefixes = [
  'gpt-4o-',
  // ChatGPT models
  'chatgpt-',
+  // Codex
+  'codex-',
  // ...rest
  // 'gpt-4-turbo-',
  // 'gpt-4-',