Merge c261ebc82c into 11b37c15bd

Merge pull request #6450 from stephen-zeng/main
Add gpt-4.1 family & gpt-4.5-preview support
2025-10-16 23:13:42 +08:00 · 2025-04-18 08:48:01 +08:00 · 2025-04-17 08:29:19 +08:00 · 2025-04-16 22:10:47 +08:00 · 2025-04-16 22:02:35 +08:00 · 2025-04-06 16:56:54 +08:00
2 changed files with 27 additions and 2 deletions
--- a/app/client/platforms/openai.ts
+++ b/app/client/platforms/openai.ts
@@ -56,7 +56,7 @@ export interface OpenAIListModelResponse {

 export interface RequestPayload {
  messages: {
-    role: "system" | "user" | "assistant";
+    role: "developer" | "system" | "user" | "assistant";
    content: string | MultimodalContent[];
  }[];
  stream?: boolean;
@@ -237,8 +237,16 @@ export class ChatGPTApi implements LLMApi {
        // Please do not ask me why not send max_tokens, no reason, this param is just shit, I dont want to explain anymore.
      };

-      // O1 使用 max_completion_tokens 控制token数 (https://platform.openai.com/docs/guides/reasoning#controlling-costs)
      if (isO1OrO3) {
+        // by default the o1/o3 models will not attempt to produce output that includes markdown formatting
+        // manually add "Formatting re-enabled" developer message to encourage markdown inclusion in model responses
+        // (https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/reasoning?tabs=python-secure#markdown-output)
+        requestPayload["messages"].unshift({
+          role: "developer",
+          content: "Formatting re-enabled",
+        });
+
+        // o1/o3 uses max_completion_tokens to control the number of tokens (https://platform.openai.com/docs/guides/reasoning#controlling-costs)
        requestPayload["max_completion_tokens"] = modelConfig.max_tokens;
      }

--- a/app/constant.ts
+++ b/app/constant.ts
@@ -417,6 +417,14 @@ export const KnowledgeCutOffDate: Record<string, string> = {
  "gpt-4-turbo": "2023-12",
  "gpt-4-turbo-2024-04-09": "2023-12",
  "gpt-4-turbo-preview": "2023-12",
+  "gpt-4.1": "2024-06",
+  "gpt-4.1-2025-04-14": "2024-06",
+  "gpt-4.1-mini": "2024-06",
+  "gpt-4.1-mini-2025-04-14": "2024-06",
+  "gpt-4.1-nano": "2024-06",
+  "gpt-4.1-nano-2025-04-14": "2024-06",
+  "gpt-4.5-preview": "2023-10",
+  "gpt-4.5-preview-2025-02-27": "2023-10",
  "gpt-4o": "2023-10",
  "gpt-4o-2024-05-13": "2023-10",
  "gpt-4o-2024-08-06": "2023-10",
@@ -458,6 +466,7 @@ export const DEFAULT_TTS_VOICES = [
 export const VISION_MODEL_REGEXES = [
  /vision/,
  /gpt-4o/,
+  /gpt-4\.1/,
  /claude-3/,
  /gemini-1\.5/,
  /gemini-exp/,
@@ -485,6 +494,14 @@ const openaiModels = [
  "gpt-4-32k-0613",
  "gpt-4-turbo",
  "gpt-4-turbo-preview",
+  "gpt-4.1",
+  "gpt-4.1-2025-04-14",
+  "gpt-4.1-mini",
+  "gpt-4.1-mini-2025-04-14",
+  "gpt-4.1-nano",
+  "gpt-4.1-nano-2025-04-14",
+  "gpt-4.5-preview",
+  "gpt-4.5-preview-2025-02-27",
  "gpt-4o",
  "gpt-4o-2024-05-13",
  "gpt-4o-2024-08-06",
Author	SHA1	Message	Date
Yunling Zhu	664390410b	Merge `c261ebc82c` into `11b37c15bd`	2025-04-18 08:48:01 +08:00
RiverRay	11b37c15bd	Merge pull request #6450 from stephen-zeng/main: Add gpt-4.1 family & gpt-4.5-preview support [Some checks failed: Run Tests / test (push) has been cancelled]	2025-04-17 08:29:19 +08:00
QwQwQ	1d0038f17d	add gpt-4.5-preview support	2025-04-16 22:10:47 +08:00
QwQwQ	619fa519c0	add gpt-4.1 family support	2025-04-16 22:02:35 +08:00
Yunling Zhu	c261ebc82c	use unshift to improve perf	2025-04-06 16:56:54 +08:00
Yunling Zhu	f7c747c65f	encourage markdown inclusion for o1/o3	2025-04-03 22:11:59 +08:00