fix: gpt-4.1 max model token (#588)

BobDu · web-flow · commit 17dedfc7d6b4 · 2025-04-16T19:53:50.000+08:00
Signed-off-by: Bob Du &lt;i@bobdu.cc&gt;
diff --git a/service/src/chatgpt/index.ts b/service/src/chatgpt/index.ts
@@ -58,36 +58,20 @@ export async function initApi(key: KeyConfig, chatModel: string, maxContextCount
     // Set the token limits based on the model's type. This is because different models have different token limits.
     // The token limit includes the token count from both the message array sent and the model response.
 
-    // Check if the model type is GPT-4-turbo or newer
-    if (model.toLowerCase().includes('gpt-4o-2024-08-06') || model.toLowerCase().includes('chatgpt-4o-latest')) {
-      // 'gpt-4o-2024-08-06'/'chatgpt-4o-latest'
-      options.maxModelTokens = 128000
-      options.maxResponseTokens = 16384
+    if (model.toLowerCase().includes('gpt-4.1')) {
+      // https://platform.openai.com/docs/models/gpt-4.1
+      options.maxModelTokens = 1047576
+      options.maxResponseTokens = 32768
     }
-    if (model.toLowerCase().includes('gpt-4o') || model.toLowerCase().includes('gpt-4-turbo') || model.toLowerCase().includes('-preview')) {
-      // 'gpt-4o'/'gpt-4-turbo'/'xxxx-preview'
+    else if (model.toLowerCase().includes('gpt-4o')) {
+      // https://platform.openai.com/docs/models/gpt-4o
       options.maxModelTokens = 128000
-      options.maxResponseTokens = 4096
-    }
-    else if (model.toLowerCase().includes('gpt-4')) {
-      // 'gpt-4'
-      options.maxModelTokens = 8192
-      options.maxResponseTokens = 8192
-    }
-    else if (model.toLowerCase().includes('gpt-3.5-turbo-instruct')) {
-      // 'gpt-3.5-turbo-instruct'
-      options.maxModelTokens = 4096
-      options.maxResponseTokens = 4096
-    }
-    else if (model.toLowerCase().includes('gpt-3.5-turbo')) {
-      // 'gpt-3.5-turbo'
-      options.maxModelTokens = 16385
-      options.maxResponseTokens = 4096
+      options.maxResponseTokens = 16384
     }
     // If none of the above, use the default values
     else {
-      options.maxModelTokens = 4096
-      options.maxResponseTokens = 1024
+      options.maxModelTokens = 1047576
+      options.maxResponseTokens = 32768
     }
 
     if (isNotEmptyString(OPENAI_API_BASE_URL))