chore: o1模型使用max_completion_tokens

2025-10-14 09:29:43 +08:00 · 2024-11-07 19:45:27 +08:00
parent fbb9385f23
commit d5bda2904d
1 changed files with 6 additions and 0 deletions
--- a/app/client/platforms/openai.ts
+++ b/app/client/platforms/openai.ts
@@ -65,6 +65,7 @@ export interface RequestPayload {
  frequency_penalty: number;
  top_p: number;
  max_tokens?: number;
+  max_completion_tokens?: number;
 }

 export interface DalleRequestPayload {
@@ -233,6 +234,11 @@ export class ChatGPTApi implements LLMApi {
        // Please do not ask me why not send max_tokens, no reason, this param is just shit, I dont want to explain anymore.
      };

+      // O1 uses max_completion_tokens to control the token count (https://platform.openai.com/docs/guides/reasoning#controlling-costs)
+      if (isO1) {
+        requestPayload["max_completion_tokens"] = modelConfig.max_tokens;
+      }
+
      // add max_tokens to vision model
      if (visionModel) {
        requestPayload["max_tokens"] = Math.max(modelConfig.max_tokens, 4000);