1 Commits

Author SHA1 Message Date
penurin d5fd93f64a Adjust release o1 context to 200K 2024-12-27 17:05:48 +00:00
@@ -7,7 +7,7 @@ import { RequestPreprocessor } from "../index";
const CLAUDE_MAX_CONTEXT = config.maxContextTokensAnthropic; const CLAUDE_MAX_CONTEXT = config.maxContextTokensAnthropic;
const OPENAI_MAX_CONTEXT = config.maxContextTokensOpenAI; const OPENAI_MAX_CONTEXT = config.maxContextTokensOpenAI;
// todo: make configurable // todo: make configurable
const GOOGLE_AI_MAX_CONTEXT = 1024000; const GOOGLE_AI_MAX_CONTEXT = 2048000;
const MISTRAL_AI_MAX_CONTENT = 131072; const MISTRAL_AI_MAX_CONTENT = 131072;
/** /**
@@ -68,6 +68,12 @@ export const validateContextSize: RequestPreprocessor = async (req) => {
modelMax = 131072; modelMax = 131072;
} else if (model.match(/^gpt-4(-\d{4})?-vision(-preview)?$/)) { } else if (model.match(/^gpt-4(-\d{4})?-vision(-preview)?$/)) {
modelMax = 131072; modelMax = 131072;
} else if (model.match(/^o1(-\d{4}-\d{2}-\d{2})?$/)) {
modelMax = 200000;
} else if (model.match(/^o1-mini(-\d{4}-\d{2}-\d{2})?$/)) {
modelMax = 128000;
} else if (model.match(/^o1-preview(-\d{4}-\d{2}-\d{2})?$/)) {
modelMax = 128000;
} else if (model.match(/gpt-3.5-turbo/)) { } else if (model.match(/gpt-3.5-turbo/)) {
modelMax = 16384; modelMax = 16384;
} else if (model.match(/gpt-4-32k/)) { } else if (model.match(/gpt-4-32k/)) {