From f95e24afbb55b3ec6afd9a22a28fe8878c959f1e Mon Sep 17 00:00:00 2001
From: nai-degen
Date: Sun, 19 Nov 2023 02:23:41 -0600
Subject: [PATCH] fixes incorrect max model size for gpt4-v

---
 src/proxy/middleware/request/validate-context-size.ts | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/proxy/middleware/request/validate-context-size.ts b/src/proxy/middleware/request/validate-context-size.ts
index ee661c9..9e813fa 100644
--- a/src/proxy/middleware/request/validate-context-size.ts
+++ b/src/proxy/middleware/request/validate-context-size.ts
@@ -46,6 +46,8 @@ export const validateContextSize: RequestPreprocessor = async (req) => {
     modelMax = 16384;
   } else if (model.match(/gpt-4-1106(-preview)?/)) {
     modelMax = 131072;
+  } else if (model.match(/^gpt-4(-\d{4})?-vision(-preview)?$/)) {
+    modelMax = 131072;
   } else if (model.match(/gpt-3.5-turbo/)) {
     modelMax = 4096;
   } else if (model.match(/gpt-4-32k/)) {