mirror of
https://github.com/enricoros/big-AGI.git
synced 2026-05-10 21:50:14 -07:00
OpenAI: update models
This commit is contained in:
@@ -43,6 +43,18 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
chatPrice: { input: 3, output: 12 },
|
||||
isPreview: true,
|
||||
},
|
||||
{
|
||||
hidden: true, // RESPONSES API UNSUPPORTED YET
|
||||
idPrefix: 'codex-mini-latest',
|
||||
label: 'Codex Mini Latest',
|
||||
description: 'Fast reasoning model optimized for the Codex CLI. A fine-tuned version of o4-mini.',
|
||||
contextWindow: 200000,
|
||||
maxCompletionTokens: 100000,
|
||||
trainingDataCutoff: 'May 31, 2024',
|
||||
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
|
||||
parameterSpecs: [{ paramId: 'llmVndOaiReasoningEffort' }],
|
||||
chatPrice: { input: 1.5, cache: { cType: 'oai-ac', read: 0.375 }, output: 6 },
|
||||
},
|
||||
|
||||
|
||||
/// Reasoning models - o-series
|
||||
@@ -77,6 +89,36 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
// benchmarks not available yet, as of 2025-04-16 (intro)
|
||||
},
|
||||
|
||||
// o3-pro - (v1/responses API - UNSUPPORTED YET) 💎💰
|
||||
{
|
||||
hidden: true, // UNSUPPORTED /responses API yet
|
||||
idPrefix: 'o3-pro-2025-06-10',
|
||||
label: 'o3 Pro (2025-06-10) [unsupported]',
|
||||
description: 'Requires (unsupported) Responses API. Version of o3 with more compute for better responses. Provides consistently better answers for complex tasks.',
|
||||
contextWindow: 200000,
|
||||
maxCompletionTokens: 100000,
|
||||
trainingDataCutoff: 'May 31, 2024',
|
||||
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning],
|
||||
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
|
||||
chatPrice: { input: 20, output: 80 },
|
||||
// benchmark: has not been measured yet
|
||||
},
|
||||
{
|
||||
idPrefix: 'o3-pro',
|
||||
label: 'o3 Pro',
|
||||
description: 'Requires (unsupported) Responses API. Version of o3 with more compute for better responses. Points to o3-pro-2025-06-10.',
|
||||
symLink: 'o3-pro-2025-06-10',
|
||||
hidden: true, // prefer versioned
|
||||
// copied from symlinked
|
||||
contextWindow: 200000,
|
||||
maxCompletionTokens: 100000,
|
||||
trainingDataCutoff: 'May 31, 2024',
|
||||
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning],
|
||||
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
|
||||
chatPrice: { input: 20, output: 80 },
|
||||
// benchmark: has not been measured yet
|
||||
},
|
||||
|
||||
/// o3
|
||||
{
|
||||
isLatest: true,
|
||||
@@ -88,7 +130,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
trainingDataCutoff: 'May 31, 2024',
|
||||
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
|
||||
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
|
||||
chatPrice: { input: 10, cache: { cType: 'oai-ac', read: 2.5 }, output: 40 },
|
||||
chatPrice: { input: 2, cache: { cType: 'oai-ac', read: 0.5 }, output: 8 },
|
||||
// benchmark: { cbaElo: 1413 /* unknown variant, as of 2025-05-12 */ },
|
||||
},
|
||||
{
|
||||
@@ -103,7 +145,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
trainingDataCutoff: 'May 31, 2024',
|
||||
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching],
|
||||
parameterSpecs: [{ paramId: 'llmForceNoStream' }, { paramId: 'llmVndOaiReasoningEffort' }, { paramId: 'llmVndOaiRestoreMarkdown' }],
|
||||
chatPrice: { input: 10, cache: { cType: 'oai-ac', read: 2.5 }, output: 40 },
|
||||
chatPrice: { input: 2, cache: { cType: 'oai-ac', read: 0.5 }, output: 8 },
|
||||
// benchmarks not available yet, as of 2025-04-16 (intro)
|
||||
},
|
||||
|
||||
@@ -123,7 +165,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
{
|
||||
idPrefix: 'o3-mini',
|
||||
label: 'o3 Mini',
|
||||
description: 'Points to the most recent o3-mini snapshot: o3-mini-2025-01-31',
|
||||
description: 'A small model alternative to o3. Points to the most recent o3-mini snapshot: o3-mini-2025-01-31',
|
||||
symLink: 'o3-mini-2025-01-31',
|
||||
hidden: true, // prefer versioned
|
||||
// copied from symlinked
|
||||
@@ -170,7 +212,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
{
|
||||
idPrefix: 'o1-2024-12-17',
|
||||
label: 'o1 (2024-12-17)',
|
||||
description: 'Latest o1 model.',
|
||||
description: 'Previous full o-series reasoning model.',
|
||||
contextWindow: 200000,
|
||||
maxCompletionTokens: 100000,
|
||||
trainingDataCutoff: 'Oct 2023',
|
||||
@@ -182,7 +224,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
{
|
||||
idPrefix: 'o1',
|
||||
label: 'o1',
|
||||
description: 'Points to the most recent snapshot of the o1 model: o1-2024-12-17',
|
||||
description: 'Previous full o-series reasoning model. Points to the most recent snapshot: o1-2024-12-17',
|
||||
symLink: 'o1-2024-12-17',
|
||||
hidden: true, // prefer versioned
|
||||
// copied from symlinked
|
||||
@@ -195,7 +237,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
benchmark: { cbaElo: 1350 },
|
||||
},
|
||||
|
||||
// o1-preview
|
||||
// o1-preview (deprecated)
|
||||
{
|
||||
hidden: true, // OUTDATED
|
||||
idPrefix: 'o1-preview-2024-09-12',
|
||||
@@ -208,6 +250,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
chatPrice: { input: 15, cache: { cType: 'oai-ac', read: 7.5 }, output: 60 },
|
||||
benchmark: { cbaElo: 1335 },
|
||||
isPreview: true,
|
||||
isLegacy: true,
|
||||
},
|
||||
{
|
||||
idPrefix: 'o1-preview',
|
||||
@@ -223,24 +266,27 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
chatPrice: { input: 15, cache: { cType: 'oai-ac', read: 7.5 }, output: 60 },
|
||||
benchmark: { cbaElo: 1335 },
|
||||
isPreview: true,
|
||||
isLegacy: true,
|
||||
},
|
||||
|
||||
// o1-mini
|
||||
// o1-mini (deprecated)
|
||||
{
|
||||
hidden: true, // DEPRECATED
|
||||
idPrefix: 'o1-mini-2024-09-12',
|
||||
label: 'o1 Mini (2024-09-12)', // ⏱️
|
||||
description: 'Latest o1-mini model snapshot. Fast, cost-efficient reasoning model tailored to coding, math, and science use cases.',
|
||||
description: 'Deprecated. Fast, cost-efficient reasoning model tailored to coding, math, and science use cases.',
|
||||
contextWindow: 128000,
|
||||
maxCompletionTokens: 65536,
|
||||
trainingDataCutoff: 'Oct 2023',
|
||||
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching, LLM_IF_HOTFIX_StripImages, LLM_IF_HOTFIX_Sys0ToUsr0],
|
||||
chatPrice: { input: 1.1, cache: { cType: 'oai-ac', read: 0.55 }, output: 4.4 },
|
||||
benchmark: { cbaElo: 1304 },
|
||||
isLegacy: true,
|
||||
},
|
||||
{
|
||||
idPrefix: 'o1-mini',
|
||||
label: 'o1 Mini',
|
||||
description: 'Points to the most recent o1-mini snapshot: o1-mini-2024-09-12',
|
||||
description: 'Deprecated. A small model alternative to o1. Points to the most recent o1-mini snapshot: o1-mini-2024-09-12',
|
||||
symLink: 'o1-mini-2024-09-12',
|
||||
hidden: true, // prefer versioned
|
||||
// copied from symlinked
|
||||
@@ -250,6 +296,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Reasoning, LLM_IF_OAI_PromptCaching, LLM_IF_HOTFIX_StripImages, LLM_IF_HOTFIX_Sys0ToUsr0],
|
||||
chatPrice: { input: 1.1, cache: { cType: 'oai-ac', read: 0.55 }, output: 4.4 },
|
||||
benchmark: { cbaElo: 1304 },
|
||||
isLegacy: true,
|
||||
},
|
||||
|
||||
/// GPT-4.1 series
|
||||
@@ -342,8 +389,8 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
{
|
||||
hidden: true, // OBSOLETE
|
||||
idPrefix: 'gpt-4.5-preview-2025-02-27',
|
||||
label: 'GPT-4.5 Preview (2025-02-27)',
|
||||
description: 'Research preview of GPT-4.5, our largest and most capable GPT model yet. Deep world knowledge and better understanding of user intent makes it good at creative tasks and agentic planning.',
|
||||
label: 'GPT-4.5 Preview (2025-02-27)', // [deprecated]
|
||||
description: 'Will be shut down on 2025-07-14. Research preview of GPT-4.5, our largest and most capable GPT model yet. Deep world knowledge and better understanding of user intent makes it good at creative tasks and agentic planning.',
|
||||
contextWindow: 128000,
|
||||
maxCompletionTokens: 16384,
|
||||
trainingDataCutoff: 'Oct 2023',
|
||||
@@ -354,7 +401,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
},
|
||||
{
|
||||
idPrefix: 'gpt-4.5-preview',
|
||||
label: 'GPT-4.5 Preview',
|
||||
label: 'GPT-4.5 Preview', // [deprecated]
|
||||
description: 'Largest GPT model, good for creative tasks and agentic planning. Currently points to gpt-4.5-preview-2025-02-27.',
|
||||
symLink: 'gpt-4.5-preview-2025-02-27',
|
||||
hidden: true, // prefer versioned
|
||||
@@ -466,6 +513,19 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
},
|
||||
|
||||
// GPT-4o Audio Preview
|
||||
{
|
||||
hidden: true, // UNSUPPORTED yet (audio output model)
|
||||
idPrefix: 'gpt-4o-audio-preview-2025-06-03',
|
||||
label: 'GPT-4o Audio Preview (2025-06-03)',
|
||||
description: 'Latest snapshot for the Audio API model.',
|
||||
contextWindow: 128000,
|
||||
maxCompletionTokens: 16384,
|
||||
trainingDataCutoff: 'Oct 2023',
|
||||
interfaces: [LLM_IF_OAI_NeedsAudio],
|
||||
chatPrice: { input: 2.5, output: 10 /* AUDIO PRICING UNSUPPORTED 40/80 */ },
|
||||
// benchmarks don't apply to audio models
|
||||
isPreview: true,
|
||||
},
|
||||
{
|
||||
hidden: true, // UNSUPPORTED yet (audio output model)
|
||||
idPrefix: 'gpt-4o-audio-preview-2024-12-17',
|
||||
@@ -496,7 +556,7 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
idPrefix: 'gpt-4o-audio-preview',
|
||||
label: 'GPT-4o Audio Preview',
|
||||
description: 'Preview release for audio inputs in chat completions.',
|
||||
symLink: 'gpt-4o-audio-preview-2024-12-17',
|
||||
symLink: 'gpt-4o-audio-preview-2024-12-17', // still points to 12-17 as of 2025-06-11
|
||||
hidden: true, // prefer versioned
|
||||
// copied from symlinked
|
||||
contextWindow: 128000,
|
||||
@@ -509,6 +569,19 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
},
|
||||
|
||||
// GPT-4o Realtime Preview
|
||||
{
|
||||
hidden: true, // UNSUPPORTED yet - REALTIME API
|
||||
idPrefix: 'gpt-4o-realtime-preview-2025-06-03',
|
||||
label: 'GPT-4o Realtime Preview (2025-06-03)',
|
||||
description: 'Latest snapshot for the Realtime API model.',
|
||||
contextWindow: 128000,
|
||||
maxCompletionTokens: 4096,
|
||||
trainingDataCutoff: 'Oct 2023',
|
||||
interfaces: [LLM_IF_OAI_Realtime],
|
||||
chatPrice: { input: 5, cache: { cType: 'oai-ac', read: 2.5 }, output: 20 /* AUDIO PRICING UNSUPPORTED 40/80 */ },
|
||||
// benchmarks don't apply to realtime models
|
||||
isPreview: true,
|
||||
},
|
||||
{
|
||||
hidden: true, // UNSUPPORTED yet - REALTIME API
|
||||
idPrefix: 'gpt-4o-realtime-preview-2024-12-17',
|
||||
@@ -871,6 +944,8 @@ export const _knownOpenAIChatModels: ManualMappings = [
|
||||
const openAIModelsDenyList: string[] = [
|
||||
// [OpenAI, 2025-03-11] FIXME: NOT YET SUPPORTED - "RESPONSES API"
|
||||
'computer-use-preview', 'computer-use-preview-2025-03-11', // FIXME: support these
|
||||
'codex-mini-latest', // FIXME: support these
|
||||
// 'o3-pro', // FIXME: support these
|
||||
'o1-pro', // FIXME: support these
|
||||
|
||||
// Legacy GPT models
|
||||
@@ -898,7 +973,7 @@ const openAIModelsDenyList: string[] = [
|
||||
'gpt-image-1', 'dall-e-3', 'dall-e-2',
|
||||
|
||||
// Moderation models
|
||||
'omni-moderation-latest', 'omni-moderation-2024-09-26',
|
||||
'omni-moderation-latest', 'omni-moderation-2024-09-26', 'text-moderation-latest',
|
||||
];
|
||||
|
||||
export function openAIModelFilter(model: OpenAIWire_API_Models_List.Model) {
|
||||
@@ -921,6 +996,8 @@ const _manualOrderingIdPrefixes = [
|
||||
'o4-20',
|
||||
'o4-mini-20',
|
||||
'o4-',
|
||||
'o3-pro-20',
|
||||
'o3-pro',
|
||||
'o3-20',
|
||||
'o3-mini-20',
|
||||
'o3-',
|
||||
@@ -952,6 +1029,8 @@ const _manualOrderingIdPrefixes = [
|
||||
'gpt-4o-',
|
||||
// ChatGPT models
|
||||
'chatgpt-',
|
||||
// Codex
|
||||
'codex-',
|
||||
// ...rest
|
||||
// 'gpt-4-turbo-',
|
||||
// 'gpt-4-',
|
||||
|
||||
Reference in New Issue
Block a user