perf: model testing

2026-07-25 13:56:08 +00:00 · 2025-08-07 10:01:04 +08:00
parent 0f239ace17
commit 02dbe80d2f
6 changed files with 31 additions and 6 deletions
@@ -101,7 +101,7 @@ class LLMModelsService:
            model=runtime_llm_model,
            messages=[llm_entities.Message(role='user', content='Hello, world!')],
            funcs=[],
-            extra_args={},
+            extra_args=model_data.get('extra_args', {}),
        )


@@ -21,7 +21,7 @@ class AnthropicMessages(requester.ProviderAPIRequester):
    client: anthropic.AsyncAnthropic

    default_config: dict[str, typing.Any] = {
-        'base_url': 'https://api.anthropic.com/v1',
+        'base_url': 'https://api.anthropic.com',
        'timeout': 120,
    }

@@ -44,6 +44,7 @@ class AnthropicMessages(requester.ProviderAPIRequester):
        self.client = anthropic.AsyncAnthropic(
            api_key='',
            http_client=httpx_client,
+            base_url=self.requester_cfg['base_url'],
        )

    async def invoke_llm(
@@ -141,7 +142,6 @@ class AnthropicMessages(requester.ProviderAPIRequester):
                args['tools'] = tools

        try:
-            # print(json.dumps(args, indent=4, ensure_ascii=False))
            resp = await self.client.messages.create(**args)

            args = {
@@ -14,7 +14,7 @@ spec:
        zh_Hans: 基础 URL
      type: string
      required: true
-      default: "https://api.anthropic.com/v1"
+      default: "https://api.anthropic.com"
    - name: timeout
      label:
        en_US: Timeout