diff --git a/pkg/api/http/service/model.py b/pkg/api/http/service/model.py index 036c1b9c..17297ed1 100644 --- a/pkg/api/http/service/model.py +++ b/pkg/api/http/service/model.py @@ -1,13 +1,14 @@ from __future__ import annotations import uuid + import sqlalchemy +from langbot_plugin.api.entities.builtin.provider import message as provider_message from ....core import app from ....entity.persistence import model as persistence_model from ....entity.persistence import pipeline as persistence_pipeline from ....provider.modelmgr import requester as model_requester -from langbot_plugin.api.entities.builtin.provider import message as provider_message class LLMModelsService: @@ -104,12 +105,17 @@ class LLMModelsService: else: runtime_llm_model = await self.ap.model_mgr.init_runtime_llm_model(model_data) + # 有些模型厂商默认开启了思考功能,测试容易延迟 + extra_args = model_data.get('extra_args', {}) + if not extra_args or 'thinking' not in extra_args: + extra_args['thinking'] = {'type': 'disabled'} + await runtime_llm_model.requester.invoke_llm( query=None, model=runtime_llm_model, - messages=[provider_message.Message(role='user', content='Hello, world!')], + messages=[provider_message.Message(role='user', content='Hello, world! Please just reply a "Hello".')], funcs=[], - extra_args=model_data.get('extra_args', {}), + extra_args=extra_args, ) diff --git a/web/src/app/infra/http/BaseHttpClient.ts b/web/src/app/infra/http/BaseHttpClient.ts index 019a54e6..cc2c31e4 100644 --- a/web/src/app/infra/http/BaseHttpClient.ts +++ b/web/src/app/infra/http/BaseHttpClient.ts @@ -38,7 +38,7 @@ export abstract class BaseHttpClient { this.instance = axios.create({ baseURL: baseURL, - timeout: 15000, + timeout: 30000, headers: { 'Content-Type': 'application/json', },