send longer chat history

added gpt-4.1 and removed gpt-4.5-preview
ignore local Dockerfile
2025-10-19 08:23:42 +08:00 · 2025-04-15 13:37:26 -05:00 · 2025-04-15 12:52:30 -05:00 · 2025-04-01 17:53:56 -05:00 · 2025-04-01 17:48:31 -05:00 · 2025-04-01 17:47:16 -05:00
13 changed files with 18808 additions and 1994 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -49,3 +49,4 @@ masks.json

 # mcp config
 app/mcp/mcp_config.json
+Dockerfile.local
--- a/README.md
+++ b/README.md
@@ -22,12 +22,12 @@ English / [简体中文](./README_CN.md)
 [![MacOS][MacOS-image]][download-url]
 [![Linux][Linux-image]][download-url]

-[NextChatAI](https://nextchat.club?utm_source=readme) / [iOS APP](https://apps.apple.com/us/app/nextchat-ai/id6743085599) / [Web App Demo](https://app.nextchat.club) / [Desktop App](https://github.com/Yidadaa/ChatGPT-Next-Web/releases) / [Enterprise Edition](#enterprise-edition) 
+[NextChatAI](https://nextchat.club?utm_source=readme) / [Web App Demo](https://app.nextchat.dev) / [Desktop App](https://github.com/Yidadaa/ChatGPT-Next-Web/releases) / [Discord](https://discord.gg/YCkeafCafC) / [Enterprise Edition](#enterprise-edition) / [Twitter](https://twitter.com/NextChatDev)


 [saas-url]: https://nextchat.club?utm_source=readme
 [saas-image]: https://img.shields.io/badge/NextChat-Saas-green?logo=microsoftedge
-[web-url]: https://app.nextchat.club/
+[web-url]: https://app.nextchat.dev/
 [download-url]: https://github.com/Yidadaa/ChatGPT-Next-Web/releases
 [Web-image]: https://img.shields.io/badge/Web-PWA-orange?logo=microsoftedge
 [Windows-image]: https://img.shields.io/badge/-Windows-blue?logo=windows
@@ -40,14 +40,13 @@ English / [简体中文](./README_CN.md)

 </div>

-## 🥳 Cheer for NextChat iOS Version Online!
-> [👉 Click Here to Install Now](https://apps.apple.com/us/app/nextchat-ai/id6743085599)
-
-> [❤️ Source Code Coming Soon](https://github.com/ChatGPTNextWeb/NextChat-iOS)
-
-![Github iOS Image](https://github.com/user-attachments/assets/e0aa334f-4c13-4dc9-8310-e3b09fa4b9f3)
-
+## 🥳 Cheer for DeepSeek, China's AI star!
+ > Purpose-Built UI for DeepSeek Reasoner Model
 
+<img src="https://github.com/user-attachments/assets/f3952210-3af1-4dc0-9b81-40eaa4847d9a"/>
+
+
+
 ## 🫣 NextChat Support MCP  ! 
 > Before build, please set env ENABLE_MCP=true

--- a/app/client/platforms/anthropic.ts
+++ b/app/client/platforms/anthropic.ts
@@ -71,8 +71,6 @@ const ClaudeMapper = {
  system: "user",
 } as const;

-const keys = ["claude-2, claude-instant-1"];
-
 export class ClaudeApi implements LLMApi {
  speech(options: SpeechOptions): Promise<ArrayBuffer> {
    throw new Error("Method not implemented.");
--- a/app/client/platforms/google.ts
+++ b/app/client/platforms/google.ts
@@ -197,8 +197,6 @@ export class GeminiProApi implements LLMApi {
        signal: controller.signal,
        headers: getHeaders(),
      };
-
-      const isThinking = options.config.model.includes("-thinking");
      // make a fetch request
      const requestTimeoutId = setTimeout(
        () => controller.abort(),
--- a/app/client/platforms/openai.ts
+++ b/app/client/platforms/openai.ts
@@ -56,7 +56,7 @@ export interface OpenAIListModelResponse {

 export interface RequestPayload {
  messages: {
-    role: "developer" | "system" | "user" | "assistant";
+    role: "system" | "user" | "assistant";
    content: string | MultimodalContent[];
  }[];
  stream?: boolean;
@@ -67,6 +67,8 @@ export interface RequestPayload {
  top_p: number;
  max_tokens?: number;
  max_completion_tokens?: number;
+  reasoning_effort?: string;
+  // NOTE: reasoning_effort (above) is only set for o3 models
 }

 export interface DalleRequestPayload {
@@ -196,10 +198,9 @@ export class ChatGPTApi implements LLMApi {
    let requestPayload: RequestPayload | DalleRequestPayload;

    const isDalle3 = _isDalle3(options.config.model);
-    const isO1OrO3 =
-      options.config.model.startsWith("o1") ||
-      options.config.model.startsWith("o3") ||
-      options.config.model.startsWith("o4-mini");
+    const isO1 = options.config.model.startsWith("o1");
+    const isO3 = options.config.model.startsWith("o3");
+    const isO1OrO3 = isO1 || isO3;
    if (isDalle3) {
      const prompt = getMessageTextContent(
        options.messages.slice(-1)?.pop() as any,
@@ -238,22 +239,23 @@ export class ChatGPTApi implements LLMApi {
        // Please do not ask me why not send max_tokens, no reason, this param is just shit, I dont want to explain anymore.
      };

+      // o1/o3 use max_completion_tokens to control the number of tokens (https://platform.openai.com/docs/guides/reasoning#controlling-costs)
      if (isO1OrO3) {
-        // by default the o1/o3 models will not attempt to produce output that includes markdown formatting
-        // manually add "Formatting re-enabled" developer message to encourage markdown inclusion in model responses
-        // (https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/reasoning?tabs=python-secure#markdown-output)
-        requestPayload["messages"].unshift({
-          role: "developer",
-          content: "Formatting re-enabled",
-        });
-
-        // o1/o3 uses max_completion_tokens to control the number of tokens (https://platform.openai.com/docs/guides/reasoning#controlling-costs)
        requestPayload["max_completion_tokens"] = modelConfig.max_tokens;
      }

+      if (isO3) {
+        requestPayload["reasoning_effort"] = "high";
+        // make o3 models (any model name starting with "o3", e.g. o3-mini) default to high reasoning effort
+      }
+
      // add max_tokens to vision model
-      if (visionModel && !isO1OrO3) {
-        requestPayload["max_tokens"] = Math.max(modelConfig.max_tokens, 4000);
+      if (visionModel) {
+        if (isO1) {
+          requestPayload["max_completion_tokens"] = modelConfig.max_tokens;
+        } else {
+          requestPayload["max_tokens"] = Math.max(modelConfig.max_tokens, 4000);
+        }
      }
    }

@@ -295,6 +297,11 @@ export class ChatGPTApi implements LLMApi {
          isDalle3 ? OpenaiPath.ImagePath : OpenaiPath.ChatPath,
        );
      }
+      // make a fetch request
+      const requestTimeoutId = setTimeout(
+        () => controller.abort(),
+        getTimeoutMSByModel(options.config.model),
+      );
      if (shouldStream) {
        let index = -1;
        const [tools, funcs] = usePluginStore
@@ -402,12 +409,6 @@ export class ChatGPTApi implements LLMApi {
          headers: getHeaders(),
        };

-        // make a fetch request
-        const requestTimeoutId = setTimeout(
-          () => controller.abort(),
-          getTimeoutMSByModel(options.config.model),
-        );
-
        const res = await fetch(chatPath, chatPayload);
        clearTimeout(requestTimeoutId);

--- a/app/constant.ts
+++ b/app/constant.ts
@@ -408,43 +408,20 @@ You are an AI assistant with access to system tools. Your role is to help users
   
 `;

-export const SUMMARIZE_MODEL = "gpt-4o-mini";
-export const GEMINI_SUMMARIZE_MODEL = "gemini-pro";
+export const SUMMARIZE_MODEL = "gpt-4.1-mini";
+export const GEMINI_SUMMARIZE_MODEL = "gemini-2.0-flash";
 export const DEEPSEEK_SUMMARIZE_MODEL = "deepseek-chat";

 export const KnowledgeCutOffDate: Record<string, string> = {
-  default: "2021-09",
-  "gpt-4-turbo": "2023-12",
-  "gpt-4-turbo-2024-04-09": "2023-12",
-  "gpt-4-turbo-preview": "2023-12",
-  "gpt-4.1": "2024-06",
-  "gpt-4.1-2025-04-14": "2024-06",
-  "gpt-4.1-mini": "2024-06",
-  "gpt-4.1-mini-2025-04-14": "2024-06",
-  "gpt-4.1-nano": "2024-06",
-  "gpt-4.1-nano-2025-04-14": "2024-06",
-  "gpt-4.5-preview": "2023-10",
-  "gpt-4.5-preview-2025-02-27": "2023-10",
-  "gpt-4o": "2023-10",
-  "gpt-4o-2024-05-13": "2023-10",
-  "gpt-4o-2024-08-06": "2023-10",
-  "gpt-4o-2024-11-20": "2023-10",
-  "chatgpt-4o-latest": "2023-10",
-  "gpt-4o-mini": "2023-10",
-  "gpt-4o-mini-2024-07-18": "2023-10",
-  "gpt-4-vision-preview": "2023-04",
-  "o1-mini-2024-09-12": "2023-10",
-  "o1-mini": "2023-10",
-  "o1-preview-2024-09-12": "2023-10",
-  "o1-preview": "2023-10",
-  "o1-2024-12-17": "2023-10",
-  o1: "2023-10",
-  "o3-mini-2025-01-31": "2023-10",
-  "o3-mini": "2023-10",
+  default: "2023-10",
  // After improvements,
  // it's now easier to add "KnowledgeCutOffDate" instead of stupid hardcoding it, as was done previously.
-  "gemini-pro": "2023-12",
-  "gemini-pro-vision": "2023-12",
+  "gemini-2.5-pro-exp-03-25": "2025-01",
+  "gemini-2.0-flash": "2024-08",
+  "claude-3-7-sonnet-latest": "2024-10",
+  "claude-3-5-haiku-latest": "2024-10",
+  "gpt-4.1": "2024-06",
+  "gpt-4.1-mini": "2024-06",
  "deepseek-chat": "2024-07",
  "deepseek-coder": "2024-07",
 };
@@ -465,12 +442,12 @@ export const DEFAULT_TTS_VOICES = [

 export const VISION_MODEL_REGEXES = [
  /vision/,
-  /gpt-4o/,
  /gpt-4\.1/,
  /claude-3/,
  /gemini-1\.5/,
  /gemini-exp/,
  /gemini-2\.0/,
+  /gemini-2\.5-pro/,
  /learnlm/,
  /qwen-vl/,
  /qwen2-vl/,
@@ -478,86 +455,23 @@ export const VISION_MODEL_REGEXES = [
  /^dall-e-3$/, // Matches exactly "dall-e-3"
  /glm-4v/,
  /vl/i,
-  /o3/,
-  /o4-mini/,
+  /o1/,
 ];

 export const EXCLUDE_VISION_MODEL_REGEXES = [/claude-3-5-haiku-20241022/];

-const openaiModels = [
-  // As of July 2024, gpt-4o-mini should be used in place of gpt-3.5-turbo,
-  // as it is cheaper, more capable, multimodal, and just as fast. gpt-3.5-turbo is still available for use in the API.
-  "gpt-3.5-turbo",
-  "gpt-3.5-turbo-1106",
-  "gpt-3.5-turbo-0125",
-  "gpt-4",
-  "gpt-4-0613",
-  "gpt-4-32k",
-  "gpt-4-32k-0613",
-  "gpt-4-turbo",
-  "gpt-4-turbo-preview",
-  "gpt-4.1",
-  "gpt-4.1-2025-04-14",
-  "gpt-4.1-mini",
-  "gpt-4.1-mini-2025-04-14",
-  "gpt-4.1-nano",
-  "gpt-4.1-nano-2025-04-14",
-  "gpt-4.5-preview",
-  "gpt-4.5-preview-2025-02-27",
-  "gpt-4o",
-  "gpt-4o-2024-05-13",
-  "gpt-4o-2024-08-06",
-  "gpt-4o-2024-11-20",
-  "chatgpt-4o-latest",
-  "gpt-4o-mini",
-  "gpt-4o-mini-2024-07-18",
-  "gpt-4-vision-preview",
-  "gpt-4-turbo-2024-04-09",
-  "gpt-4-1106-preview",
-  "dall-e-3",
-  "o1-mini",
-  "o1-preview",
-  "o3-mini",
-  "o3",
-  "o4-mini",
-];
+const openaiModels = ["dall-e-3", "o1", "o3-mini", "gpt-4.1", "gpt-4.1-mini"];

 const googleModels = [
-  "gemini-1.5-pro-latest",
-  "gemini-1.5-pro",
-  "gemini-1.5-pro-002",
-  "gemini-1.5-flash-latest",
-  "gemini-1.5-flash-8b-latest",
-  "gemini-1.5-flash",
-  "gemini-1.5-flash-8b",
-  "gemini-1.5-flash-002",
-  "learnlm-1.5-pro-experimental",
-  "gemini-exp-1206",
  "gemini-2.0-flash",
-  "gemini-2.0-flash-exp",
-  "gemini-2.0-flash-lite-preview-02-05",
-  "gemini-2.0-flash-thinking-exp",
-  "gemini-2.0-flash-thinking-exp-1219",
-  "gemini-2.0-flash-thinking-exp-01-21",
-  "gemini-2.0-pro-exp",
-  "gemini-2.0-pro-exp-02-05",
-  "gemini-2.5-pro-preview-06-05",
+  "gemini-2.0-flash-lite",
+  "gemini-2.5-pro-exp-03-25",
 ];

 const anthropicModels = [
-  "claude-instant-1.2",
-  "claude-2.0",
-  "claude-2.1",
-  "claude-3-sonnet-20240229",
-  "claude-3-opus-20240229",
  "claude-3-opus-latest",
-  "claude-3-haiku-20240307",
-  "claude-3-5-haiku-20241022",
  "claude-3-5-haiku-latest",
-  "claude-3-5-sonnet-20240620",
-  "claude-3-5-sonnet-20241022",
  "claude-3-5-sonnet-latest",
-  "claude-3-7-sonnet-20250219",
  "claude-3-7-sonnet-latest",
 ];

@@ -628,18 +542,6 @@ const xAIModes = [
  "grok-2-vision-1212",
  "grok-2-vision",
  "grok-2-vision-latest",
-  "grok-3-mini-fast-beta",
-  "grok-3-mini-fast",
-  "grok-3-mini-fast-latest",
-  "grok-3-mini-beta",
-  "grok-3-mini",
-  "grok-3-mini-latest",
-  "grok-3-fast-beta",
-  "grok-3-fast",
-  "grok-3-fast-latest",
-  "grok-3-beta",
-  "grok-3",
-  "grok-3-latest",
 ];

 const chatglmModels = [
--- a/app/store/config.ts
+++ b/app/store/config.ts
@@ -66,14 +66,14 @@ export const DEFAULT_CONFIG = {
  modelConfig: {
    model: "gpt-4o-mini" as ModelType,
    providerName: "OpenAI" as ServiceProvider,
-    temperature: 0.5,
+    temperature: 0.2,
    top_p: 1,
    max_tokens: 4000,
    presence_penalty: 0,
    frequency_penalty: 0,
    sendMemory: true,
-    historyMessageCount: 4,
-    compressMessageLengthThreshold: 1000,
+    historyMessageCount: 20,
+    compressMessageLengthThreshold: 5000,
    compressModel: "",
    compressProviderName: "",
    enableInjectSystemPrompts: true,
--- a/app/utils.ts
+++ b/app/utils.ts
@@ -304,9 +304,18 @@ export function getTimeoutMSByModel(model: string) {
    model.startsWith("o1") ||
    model.startsWith("o3") ||
    model.includes("deepseek-r") ||
-    model.includes("-thinking")
-  )
+    model.includes("-thinking") ||
+    model.includes("pro")
+  ) {
+    console.log(
+      "thinking model is " +
+        model +
+        " timeout is " +
+        REQUEST_TIMEOUT_MS_FOR_THINKING,
+    );
    return REQUEST_TIMEOUT_MS_FOR_THINKING;
+  }
+  console.log("normal model is " + model + " timeout is " + REQUEST_TIMEOUT_MS);
  return REQUEST_TIMEOUT_MS;
 }

--- a/package-lock.json
+++ b/package-lock.json
--- a/package.json
+++ b/package.json
@@ -83,7 +83,7 @@
    "jest": "^29.7.0",
    "jest-environment-jsdom": "^29.7.0",
    "lint-staged": "^13.2.2",
-    "prettier": "^3.6.2",
+    "prettier": "^3.0.2",
    "ts-node": "^10.9.2",
    "tsx": "^4.16.0",
    "typescript": "5.2.2",
--- a/test/model-available.test.ts
+++ b/test/model-available.test.ts
@@ -3,7 +3,7 @@ import { isModelNotavailableInServer } from "../app/utils/model";
 describe("isModelNotavailableInServer", () => {
  test("test model will return false, which means the model is available", () => {
    const customModels = "";
-    const modelName = "gpt-4";
+    const modelName = "gpt-4.1";
    const providerNames = "OpenAI";
    const result = isModelNotavailableInServer(
      customModels,
--- a/test/vision-model-checker.test.ts
+++ b/test/vision-model-checker.test.ts
@@ -15,10 +15,11 @@ describe("isVisionModel", () => {

  test("should identify vision models using regex patterns", () => {
    const visionModels = [
-      "gpt-4-vision",
+      "gpt-4.1",
      "claude-3-opus",
      "gemini-1.5-pro",
      "gemini-2.0",
+      "gemini-2.5-pro",
      "gemini-exp-vision",
      "learnlm-vision",
      "qwen-vl-max",
--- a/yarn.lock
+++ b/yarn.lock
Author	SHA1	Message	Date
Davidlasky	ac7b720b5b	send longer chat history	2025-04-15 13:37:26 -05:00
Davidlasky	d02f9b0dd4	added gpt-4.1 and removed gpt-4.5-preview	2025-04-15 12:52:30 -05:00
Davidlasky	f2a5af7556	ignore local Dockerfile	2025-04-01 17:53:56 -05:00
Davidlasky	ff196f22c2	local debug	2025-04-01 17:48:31 -05:00
Davidlasky	106db97f8c	enable o3-mini-high, optimize timeout for thinking models	2025-04-01 17:47:16 -05:00
Davidlasky	e30d90714b	remove legacy models and support new models	2025-04-01 17:45:33 -05:00
Davidlasky	2329d59c83	defaults o3-mini to high	2025-04-01 13:33:38 -05:00
Davidlasky	b5ee4c1fcf	make timeout longer	2025-03-29 02:28:00 -05:00
LaskyJ	6d69494e08	Update utils.ts	2025-03-27 12:52:25 -05:00
Davidlasky	2509495cdc	try to add o1 as a vision model	2025-03-25 18:01:23 -05:00
LaskyJ	d65aca6d13	Update constant.ts	2025-03-25 15:40:36 -05:00
LaskyJ	2f5184c5b4	Update constant.ts	2025-03-25 15:27:26 -05:00
GH Action - Upstream Sync	20df2eed07	Merge branch 'main' of https://github.com/ChatGPTNextWeb/ChatGPT-Next-Web	2025-03-21 01:00:47 +00:00
LaskyJ	fd998de148	Merge branch 'ChatGPTNextWeb:main' into main	2025-03-14 18:47:04 -05:00
GH Action - Upstream Sync	fd2e69d1c7	Merge branch 'main' of https://github.com/ChatGPTNextWeb/ChatGPT-Next-Web	2025-03-02 01:01:58 +00:00
GH Action - Upstream Sync	e8dcede878	Merge branch 'main' of https://github.com/ChatGPTNextWeb/ChatGPT-Next-Web	2025-03-01 01:02:26 +00:00
GH Action - Upstream Sync	3b23f5f8ab	Merge branch 'main' of https://github.com/ChatGPTNextWeb/ChatGPT-Next-Web	2025-02-27 00:58:12 +00:00
LaskyJ	75cdd15bc2	Update constant.ts	2025-02-25 21:04:07 -06:00
LaskyJ	af1dfd2a6c	Update constant.ts	2025-02-25 20:52:01 -06:00
LaskyJ	6aecdd80e9	Update constant.ts	2025-02-25 20:50:10 -06:00