OpenAI: update models

This commit is contained in:
Enrico Ros
2025-06-11 14:11:14 -07:00
parent 702006f6ea
commit 13e0779ced
@@ -43,6 +43,18 @@ export const _knownOpenAIChatModels: ManualMappings = [
chatPrice: { input: 3, output: 12 },
isPreview: true,
},
{
hidden: true, // RESPONSES API UNSUPPORTED YET
idPrefix: 'codex-mini-latest',
label: 'Codex Mini Latest',
description: 'Fast reasoning model optimized for the Codex CLI. A fine-tuned version of o4-mini.',
contextWindow: 200000,
maxCompletionTokens: 100000,
trainingDataCutoff: 'May 31, 2024',
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
parameterSpecs: [{ paramId: 'llmVndOaiReasoningEffort' }],
chatPrice: { input: 1.5, cache: { cType: 'oai-ac', read: 0.375 }, output: 6 },
},
/// Reasoning models - o-series
@@ -77,6 +89,36 @@ export const _knownOpenAIChatModels: ManualMappings = [
// benchmarks not available yet, as of 2025-04-16 (intro)
},
// o3-pro - (v1/responses API - UNSUPPORTED YET) 💎💰
{
hidden: true, // UNSUPPORTED /responses API yet
idPrefix: 'o3-pro-2025-06-10',
label: 'o3 Pro (2025-06-10) [unsupported]',
description: 'Requires (unsupported) Responses API. Version of o3 with more compute for better responses. Provides consistently better answers for complex tasks.',
contextWindow: 200000,
maxCompletionTokens: 100000,
trainingDataCutoff: 'May 31, 2024',
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning],
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
chatPrice: { input: 20, output: 80 },
// benchmark: has not been measured yet
},
{
idPrefix: 'o3-pro',
label: 'o3 Pro',
description: 'Requires (unsupported) Responses API. Version of o3 with more compute for better responses. Points to o3-pro-2025-06-10.',
symLink: 'o3-pro-2025-06-10',
hidden: true, // prefer versioned
// copied from symlinked
contextWindow: 200000,
maxCompletionTokens: 100000,
trainingDataCutoff: 'May 31, 2024',
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning],
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
chatPrice: { input: 20, output: 80 },
// benchmark: has not been measured yet
},
/// o3
{
isLatest: true,
@@ -88,7 +130,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
trainingDataCutoff: 'May 31, 2024',
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
chatPrice: { input: 10, cache: { cType: 'oai-ac', read: 2.5 }, output: 40 },
chatPrice: { input: 2, cache: { cType: 'oai-ac', read: 0.5 }, output: 8 },
// benchmark: { cbaElo: 1413 /* unknown variant, as of 2025-05-12 */ },
},
{
@@ -103,7 +145,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
trainingDataCutoff: 'May 31, 2024',
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
chatPrice: { input: 10, cache: { cType: 'oai-ac', read: 2.5 }, output: 40 },
chatPrice: { input: 2, cache: { cType: 'oai-ac', read: 0.5 }, output: 8 },
// benchmarks not available yet, as of 2025-04-16 (intro)
},
@@ -123,7 +165,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
{
idPrefix: 'o3-mini',
label: 'o3 Mini',
description: 'Points to the most recent o3-mini snapshot: o3-mini-2025-01-31',
description: 'A small model alternative to o3. Points to the most recent o3-mini snapshot: o3-mini-2025-01-31',
symLink: 'o3-mini-2025-01-31',
hidden: true, // prefer versioned
// copied from symlinked
@@ -170,7 +212,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
{
idPrefix: 'o1-2024-12-17',
label: 'o1 (2024-12-17)',
description: 'Latest o1 model.',
description: 'Previous full o-series reasoning model.',
contextWindow: 200000,
maxCompletionTokens: 100000,
trainingDataCutoff: 'Oct 2023',
@@ -182,7 +224,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
{
idPrefix: 'o1',
label: 'o1',
description: 'Points to the most recent snapshot of the o1 model: o1-2024-12-17',
description: 'Previous full o-series reasoning model. Points to the most recent snapshot: o1-2024-12-17',
symLink: 'o1-2024-12-17',
hidden: true, // prefer versioned
// copied from symlinked
@@ -195,7 +237,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
benchmark: { cbaElo: 1350 },
},
// o1-preview
// o1-preview (deprecated)
{
hidden: true, // OUTDATED
idPrefix: 'o1-preview-2024-09-12',
@@ -208,6 +250,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
chatPrice: { input: 15, cache: { cType: 'oai-ac', read: 7.5 }, output: 60 },
benchmark: { cbaElo: 1335 },
isPreview: true,
isLegacy: true,
},
{
idPrefix: 'o1-preview',
@@ -223,24 +266,27 @@ export const _knownOpenAIChatModels: ManualMappings = [
chatPrice: { input: 15, cache: { cType: 'oai-ac', read: 7.5 }, output: 60 },
benchmark: { cbaElo: 1335 },
isPreview: true,
isLegacy: true,
},
// o1-mini
// o1-mini (deprecated)
{
hidden: true, // DEPRECATED
idPrefix: 'o1-mini-2024-09-12',
label: 'o1 Mini (2024-09-12)', // ⏱️
description: 'Latest o1-mini model snapshot. Fast, cost-efficient reasoning model tailored to coding, math, and science use cases.',
description: 'Deprecated. Fast, cost-efficient reasoning model tailored to coding, math, and science use cases.',
contextWindow: 128000,
maxCompletionTokens: 65536,
trainingDataCutoff: 'Oct 2023',
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching, LLM_IF_HOTFIX_StripImages, LLM_IF_HOTFIX_Sys0ToUsr0],
chatPrice: { input: 1.1, cache: { cType: 'oai-ac', read: 0.55 }, output: 4.4 },
benchmark: { cbaElo: 1304 },
isLegacy: true,
},
{
idPrefix: 'o1-mini',
label: 'o1 Mini',
description: 'Points to the most recent o1-mini snapshot: o1-mini-2024-09-12',
description: 'Deprecated. A small model alternative to o1. Points to the most recent o1-mini snapshot: o1-mini-2024-09-12',
symLink: 'o1-mini-2024-09-12',
hidden: true, // prefer versioned
// copied from symlinked
@@ -250,6 +296,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching, LLM_IF_HOTFIX_StripImages, LLM_IF_HOTFIX_Sys0ToUsr0],
chatPrice: { input: 1.1, cache: { cType: 'oai-ac', read: 0.55 }, output: 4.4 },
benchmark: { cbaElo: 1304 },
isLegacy: true,
},
/// GPT-4.1 series
@@ -342,8 +389,8 @@ export const _knownOpenAIChatModels: ManualMappings = [
{
hidden: true, // OBSOLETE
idPrefix: 'gpt-4.5-preview-2025-02-27',
label: 'GPT-4.5 Preview (2025-02-27)',
description: 'Research preview of GPT-4.5, our largest and most capable GPT model yet. Deep world knowledge and better understanding of user intent makes it good at creative tasks and agentic planning.',
label: 'GPT-4.5 Preview (2025-02-27)', // [deprecated]
description: 'Will be shut down on 2025-07-14. Research preview of GPT-4.5, our largest and most capable GPT model yet. Deep world knowledge and better understanding of user intent makes it good at creative tasks and agentic planning.',
contextWindow: 128000,
maxCompletionTokens: 16384,
trainingDataCutoff: 'Oct 2023',
@@ -354,7 +401,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
},
{
idPrefix: 'gpt-4.5-preview',
label: 'GPT-4.5 Preview',
label: 'GPT-4.5 Preview', // [deprecated]
description: 'Largest GPT model, good for creative tasks and agentic planning. Currently points to gpt-4.5-preview-2025-02-27.',
symLink: 'gpt-4.5-preview-2025-02-27',
hidden: true, // prefer versioned
@@ -466,6 +513,19 @@ export const _knownOpenAIChatModels: ManualMappings = [
},
// GPT-4o Audio Preview
{
hidden: true, // UNSUPPORTED yet (audio output model)
idPrefix: 'gpt-4o-audio-preview-2025-06-03',
label: 'GPT-4o Audio Preview (2025-06-03)',
description: 'Latest snapshot for the Audio API model.',
contextWindow: 128000,
maxCompletionTokens: 16384,
trainingDataCutoff: 'Oct 2023',
interfaces: [LLM_IF_OAI_NeedsAudio],
chatPrice: { input: 2.5, output: 10 /* AUDIO PRICING UNSUPPORTED 40/80 */ },
// benchmarks don't apply to audio models
isPreview: true,
},
{
hidden: true, // UNSUPPORTED yet (audio output model)
idPrefix: 'gpt-4o-audio-preview-2024-12-17',
@@ -496,7 +556,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
idPrefix: 'gpt-4o-audio-preview',
label: 'GPT-4o Audio Preview',
description: 'Preview release for audio inputs in chat completions.',
symLink: 'gpt-4o-audio-preview-2024-12-17',
symLink: 'gpt-4o-audio-preview-2024-12-17', // still points to 12-17 as of 2025-06-11
hidden: true, // prefer versioned
// copied from symlinked
contextWindow: 128000,
@@ -509,6 +569,19 @@ export const _knownOpenAIChatModels: ManualMappings = [
},
// GPT-4o Realtime Preview
{
hidden: true, // UNSUPPORTED yet - REALTIME API
idPrefix: 'gpt-4o-realtime-preview-2025-06-03',
label: 'GPT-4o Realtime Preview (2025-06-03)',
description: 'Latest snapshot for the Realtime API model.',
contextWindow: 128000,
maxCompletionTokens: 4096,
trainingDataCutoff: 'Oct 2023',
interfaces: [LLM_IF_OAI_Realtime],
chatPrice: { input: 5, cache: { cType: 'oai-ac', read: 2.5 }, output: 20 /* AUDIO PRICING UNSUPPORTED 40/80 */ },
// benchmarks don't apply to realtime models
isPreview: true,
},
{
hidden: true, // UNSUPPORTED yet - REALTIME API
idPrefix: 'gpt-4o-realtime-preview-2024-12-17',
@@ -871,6 +944,8 @@ export const _knownOpenAIChatModels: ManualMappings = [
const openAIModelsDenyList: string[] = [
// [OpenAI, 2025-03-11] FIXME: NOT YET SUPPORTED - "RESPONSES API"
'computer-use-preview', 'computer-use-preview-2025-03-11', // FIXME: support these
'codex-mini-latest', // FIXME: support these
// 'o3-pro', // FIXME: support these
'o1-pro', // FIXME: support these
// Legacy GPT models
@@ -898,7 +973,7 @@ const openAIModelsDenyList: string[] = [
'gpt-image-1', 'dall-e-3', 'dall-e-2',
// Moderation models
'omni-moderation-latest', 'omni-moderation-2024-09-26',
'omni-moderation-latest', 'omni-moderation-2024-09-26', 'text-moderation-latest',
];
export function openAIModelFilter(model: OpenAIWire_API_Models_List.Model) {
@@ -921,6 +996,8 @@ const _manualOrderingIdPrefixes = [
'o4-20',
'o4-mini-20',
'o4-',
'o3-pro-20',
'o3-pro',
'o3-20',
'o3-mini-20',
'o3-',
@@ -952,6 +1029,8 @@ const _manualOrderingIdPrefixes = [
'gpt-4o-',
// ChatGPT models
'chatgpt-',
// Codex
'codex-',
// ...rest
// 'gpt-4-turbo-',
// 'gpt-4-',