Merge a87ec75ba6 into 995bef73de

Merge pull request #6599 from DreamRivulet/add-support-GPT5
add: model gpt-5
2025-09-30 15:16:38 +08:00 · 2025-08-12 23:30:50 +08:00 · 2025-08-10 17:21:12 +08:00 · 2025-08-09 17:03:49 +08:00 · 2025-08-09 17:03:49 +08:00 · 2025-08-09 17:03:49 +08:00
4 changed files with 54 additions and 27 deletions
--- a/app/api/common.ts
+++ b/app/api/common.ts
@ -90,6 +90,14 @@ export async function requestOpenai(req: NextRequest) {

  const fetchUrl = cloudflareAIGatewayUrl(`${baseUrl}/${path}`);
  console.log("fetchUrl", fetchUrl);
+
+  let payload = await req.text();
+  if (baseUrl.includes("openrouter.ai")) {
+    const body = JSON.parse(payload);
+    body["include_reasoning"] = true;
+    payload = JSON.stringify(body);
+  }
+
  const fetchOptions: RequestInit = {
    headers: {
      "Content-Type": "application/json",
@ -100,7 +108,7 @@ export async function requestOpenai(req: NextRequest) {
      }),
    },
    method: req.method,
-    body: req.body,
+    body: payload,
    // to fix #2485: https://stackoverflow.com/questions/55920957/cloudflare-worker-typeerror-one-time-use-body
    redirect: "manual",
    // @ts-ignore
@ -111,10 +119,7 @@ export async function requestOpenai(req: NextRequest) {
  // #1815 try to refuse gpt4 request
  if (serverConfig.customModels && req.body) {
    try {
-      const clonedBody = await req.text();
-      fetchOptions.body = clonedBody;
-
-      const jsonBody = JSON.parse(clonedBody) as { model?: string };
+      const jsonBody = JSON.parse(payload) as { model?: string };

      // not undefined and is false
      if (
--- a/app/client/platforms/openai.ts
+++ b/app/client/platforms/openai.ts
@ -2,10 +2,10 @@
 // azure and openai, using same models. so using same LLMApi.
 import {
  ApiPath,
-  OPENAI_BASE_URL,
-  DEFAULT_MODELS,
-  OpenaiPath,
  Azure,
+  DEFAULT_MODELS,
+  OPENAI_BASE_URL,
+  OpenaiPath,
  REQUEST_TIMEOUT_MS,
  ServiceProvider,
 } from "@/app/constant";
@ -18,13 +18,13 @@ import {
 } from "@/app/store";
 import { collectModelsWithDefaultModel } from "@/app/utils/model";
 import {
-  preProcessImageContent,
-  uploadImage,
  base64Image2Blob,
+  preProcessImageContent,
  streamWithThink,
+  uploadImage,
 } from "@/app/utils/chat";
 import { cloudflareAIGatewayUrl } from "@/app/utils/cloudflare";
-import { ModelSize, DalleQuality, DalleStyle } from "@/app/typing";
+import { DalleQuality, DalleStyle, ModelSize } from "@/app/typing";

 import {
  ChatOptions,
@ -39,9 +39,9 @@ import Locale from "../../locales";
 import { getClientConfig } from "@/app/config/client";
 import {
  getMessageTextContent,
-  isVisionModel,
-  isDalle3 as _isDalle3,
  getTimeoutMSByModel,
+  isDalle3 as _isDalle3,
+  isVisionModel,
 } from "@/app/utils";
 import { fetch } from "@/app/utils/stream";

@ -200,6 +200,7 @@ export class ChatGPTApi implements LLMApi {
      options.config.model.startsWith("o1") ||
      options.config.model.startsWith("o3") ||
      options.config.model.startsWith("o4-mini");
+    const isGpt5 =  options.config.model.startsWith("gpt-5");
    if (isDalle3) {
      const prompt = getMessageTextContent(
        options.messages.slice(-1)?.pop() as any,
@ -230,7 +231,7 @@ export class ChatGPTApi implements LLMApi {
        messages,
        stream: options.config.stream,
        model: modelConfig.model,
-        temperature: !isO1OrO3 ? modelConfig.temperature : 1,
+        temperature: (!isO1OrO3 && !isGpt5) ? modelConfig.temperature : 1,
        presence_penalty: !isO1OrO3 ? modelConfig.presence_penalty : 0,
        frequency_penalty: !isO1OrO3 ? modelConfig.frequency_penalty : 0,
        top_p: !isO1OrO3 ? modelConfig.top_p : 1,
@ -238,7 +239,13 @@ export class ChatGPTApi implements LLMApi {
        // Please do not ask me why not send max_tokens, no reason, this param is just shit, I dont want to explain anymore.
      };

-      if (isO1OrO3) {
+      if (isGpt5) {
+  	// Remove max_tokens if present
+  	delete requestPayload.max_tokens;
+  	// Send the token limit as max_completion_tokens instead of max_tokens
+  	requestPayload["max_completion_tokens"] = modelConfig.max_tokens;
+
+      } else if (isO1OrO3) {
        // by default the o1/o3 models will not attempt to produce output that includes markdown formatting
        // manually add "Formatting re-enabled" developer message to encourage markdown inclusion in model responses
        // (https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/reasoning?tabs=python-secure#markdown-output)
@ -251,8 +258,9 @@ export class ChatGPTApi implements LLMApi {
        requestPayload["max_completion_tokens"] = modelConfig.max_tokens;
      }

+
      // add max_tokens to vision model
-      if (visionModel && !isO1OrO3) {
+      if (visionModel && !isO1OrO3 && ! isGpt5) {
        requestPayload["max_tokens"] = Math.max(modelConfig.max_tokens, 4000);
      }
    }
@ -303,6 +311,13 @@ export class ChatGPTApi implements LLMApi {
            useChatStore.getState().currentSession().mask?.plugin || [],
          );
        // console.log("getAsTools", tools, funcs);
+
+        // Add "include_reasoning" for OpenRouter: https://openrouter.ai/announcements/reasoning-tokens-for-thinking-models
+        if (chatPath.includes("openrouter.ai")) {
+          // @ts-ignore
+          requestPayload["include_reasoning"] = true;
+        }
+
        streamWithThink(
          chatPath,
          requestPayload,
@ -319,6 +334,7 @@ export class ChatGPTApi implements LLMApi {
                content: string;
                tool_calls: ChatMessageTool[];
                reasoning_content: string | null;
+                reasoning: string | null;
              };
            }>;

@ -344,7 +360,9 @@ export class ChatGPTApi implements LLMApi {
              }
            }

-            const reasoning = choices[0]?.delta?.reasoning_content;
+            const reasoning =
+              choices[0]?.delta?.reasoning_content ||
+              choices[0]?.delta?.reasoning;
            const content = choices[0]?.delta?.content;

            // Skip if both content and reasoning_content are empty or null
@ -420,6 +438,7 @@ export class ChatGPTApi implements LLMApi {
      options.onError?.(e as Error);
    }
  }
+
  async usage() {
    const formatDate = (d: Date) =>
      `${d.getFullYear()}-${(d.getMonth() + 1).toString().padStart(2, "0")}-${d
@ -523,4 +542,5 @@ export class ChatGPTApi implements LLMApi {
    }));
  }
 }
+
 export { OpenaiPath };
--- a/app/constant.ts
+++ b/app/constant.ts
@ -493,6 +493,7 @@ export const VISION_MODEL_REGEXES = [
  /o3/,
  /o4-mini/,
  /grok-4/i,
+  /gpt-5/
 ];

 export const EXCLUDE_VISION_MODEL_REGEXES = [/claude-3-5-haiku-20241022/];
@ -517,6 +518,11 @@ const openaiModels = [
  "gpt-4.1-nano-2025-04-14",
  "gpt-4.5-preview",
  "gpt-4.5-preview-2025-02-27",
+  "gpt-5-chat",
+  "gpt-5-mini",
+  "gpt-5-nano",
+  "gpt-5",
+  "gpt-5-chat-2025-01-01-preview",
  "gpt-4o",
  "gpt-4o-2024-05-13",
  "gpt-4o-2024-08-06",
--- a/app/utils/chat.ts
+++ b/app/utils/chat.ts
@ -1,7 +1,7 @@
 import {
  CACHE_URL_PREFIX,
-  UPLOAD_URL,
  REQUEST_TIMEOUT_MS,
+  UPLOAD_URL,
 } from "@/app/constant";
 import { MultimodalContent, RequestMessage } from "@/app/client/api";
 import Locale from "@/app/locales";
@ -111,6 +111,7 @@ export async function preProcessImageContentForAlibabaDashScope(
 }

 const imageCaches: Record<string, string> = {};
+
 export function cacheImageToBase64Image(imageUrl: string) {
  if (imageUrl.includes(CACHE_URL_PREFIX)) {
    if (!imageCaches[imageUrl]) {
@ -385,6 +386,7 @@ export function stream(
      openWhenHidden: true,
    });
  }
+
  console.debug("[ChatAPI] start");
  chatApi(chatPath, headers, requestPayload, tools); // call fetchEventSource
 }
@ -627,16 +629,9 @@ export function streamWithThink(
              if (remainText.length > 0) {
                remainText += "\n";
              }
-              remainText += "> " + chunk.content;
-            } else {
-              // Handle newlines in thinking content
-              if (chunk.content.includes("\n\n")) {
-                const lines = chunk.content.split("\n\n");
-                remainText += lines.join("\n\n> ");
-              } else {
-                remainText += chunk.content;
-              }
+              remainText += "> ";
            }
+            remainText += chunk.content.replaceAll("\n", "\n> ");
          } else {
            // If in normal mode
            if (isInThinkingMode || isThinkingChanged) {
@ -662,6 +657,7 @@ export function streamWithThink(
      openWhenHidden: true,
    });
  }
+
  console.debug("[ChatAPI] start");
  chatApi(chatPath, headers, requestPayload, tools); // call fetchEventSource
 }
Author	SHA1	Message	Date
Xu Chenxi	69c356b170	Merge `a87ec75ba6` into `995bef73de`	2025-08-12 23:30:50 +08:00
RiverRay	995bef73de	Merge pull request #6599 from DreamRivulet/add-support-GPT5 — add: model gpt-5 [Some checks failed: Run Tests / test (push) has been cancelled]	2025-08-10 17:21:12 +08:00
Sam	38ac502d80	Add support for GPT5	2025-08-09 17:03:49 +08:00
Sam	0511808900	use max_completion_tokens	2025-08-09 17:03:49 +08:00
Sam	42eff644b4	use max_completion_tokens	2025-08-09 17:03:49 +08:00
Sam	8ae6883784	add gpt-5	2025-08-09 17:03:49 +08:00
Sam	c0f2ab6de3	add gpt-5	2025-08-09 17:03:06 +08:00
xsun2001	a87ec75ba6	Support OpenRouter reasoning when using env var	2025-02-25 16:35:03 +08:00
xsun2001	6e082ad7ac	Support reasoning for OpenRouter using OpenAI provider	2025-02-18 14:41:59 +08:00