feat(agent-runner): enforce typed host permissions

2026-06-18 19:44:21 +00:00 · 2026-06-10 22:36:23 +08:00
parent 8938ef7412
commit ea96d37e60
41 changed files with 584 additions and 3862 deletions
@@ -1,169 +0,0 @@
-"""Tests for DifyServiceAPIRunner pure utility methods.
-
-Tests the helper methods that don't require real Dify API calls.
-"""
-
-from __future__ import annotations
-
-import pytest
-
-
-class TestDifyExtractTextOutput:
-    """Tests for _extract_dify_text_output method."""
-
-    def _create_runner(self):
-        """Create runner instance."""
-        from unittest.mock import MagicMock
-
-        from langbot.pkg.provider.runners.difysvapi import DifyServiceAPIRunner
-
-        mock_app = MagicMock()
-        pipeline_config = {
-            'ai': {
-                'dify-service-api': {
-                    'app-type': 'chat',
-                    'api-key': 'test-key',
-                    'base-url': 'https://api.dify.ai',
-                }
-            },
-            'output': {'misc': {}}
-        }
-
-        runner = DifyServiceAPIRunner(mock_app, pipeline_config)
-        runner.dify_client = MagicMock()
-
-        return runner
-
-    def test_extract_none_value(self):
-        """None returns empty string."""
-        runner = self._create_runner()
-
-        result = runner._extract_dify_text_output(None)
-
-        assert result == ''
-
-    def test_extract_string_value(self):
-        """Plain string is returned."""
-        runner = self._create_runner()
-
-        result = runner._extract_dify_text_output('plain text')
-
-        assert result == 'plain text'
-
-    def test_extract_dict_with_content(self):
-        """Dict with 'content' key extracts content."""
-        runner = self._create_runner()
-
-        result = runner._extract_dify_text_output({'content': 'extracted content'})
-
-        assert result == 'extracted content'
-
-    def test_extract_dict_without_content(self):
-        """Dict without 'content' key is JSON dumped."""
-        runner = self._create_runner()
-
-        result = runner._extract_dify_text_output({'key': 'value'})
-
-        assert 'key' in result
-        assert 'value' in result
-
-    def test_extract_json_string_with_content(self):
-        """JSON string with 'content' key extracts content."""
-        runner = self._create_runner()
-
-        result = runner._extract_dify_text_output('{"content": "json content"}')
-
-        assert result == 'json content'
-
-    def test_extract_json_string_without_content(self):
-        """JSON string without 'content' key returns original."""
-        runner = self._create_runner()
-
-        result = runner._extract_dify_text_output('{"other": "value"}')
-
-        assert '{"other": "value"}' in result
-
-    def test_extract_whitespace_string(self):
-        """Whitespace string returns empty."""
-        runner = self._create_runner()
-
-        result = runner._extract_dify_text_output('   ')
-
-        assert result == ''
-
-
-class TestDifyRunnerConfigValidation:
-    """Tests for runner config validation."""
-
-    def test_invalid_app_type_raises(self):
-        """Invalid app-type raises DifyAPIError."""
-        from unittest.mock import MagicMock
-
-        from langbot.pkg.provider.runners.difysvapi import DifyServiceAPIRunner
-        from langbot.libs.dify_service_api.v1.errors import DifyAPIError
-
-        mock_app = MagicMock()
-        pipeline_config = {
-            'ai': {
-                'dify-service-api': {
-                    'app-type': 'invalid-type',
-                    'api-key': 'test',
-                    'base-url': 'https://api.dify.ai',
-                }
-            },
-            'output': {'misc': {}}
-        }
-
-        with pytest.raises(DifyAPIError, match='不支持'):
-            DifyServiceAPIRunner(mock_app, pipeline_config)
-
-    def test_valid_app_types(self):
-        """Valid app-types don't raise."""
-        from unittest.mock import MagicMock
-
-        from langbot.pkg.provider.runners.difysvapi import DifyServiceAPIRunner
-
-        mock_app = MagicMock()
-
-        for app_type in ['chat', 'agent', 'workflow']:
-            pipeline_config = {
-                'ai': {
-                    'dify-service-api': {
-                        'app-type': app_type,
-                        'api-key': 'test',
-                        'base-url': 'https://api.dify.ai',
-                    }
-                },
-                'output': {'misc': {}}
-            }
-
-            runner = DifyServiceAPIRunner(mock_app, pipeline_config)
-            # Should not raise
-            assert runner is not None
-
-
-class TestDifyRunnerInit:
-    """Tests for runner initialization."""
-
-    def test_runner_stores_config(self):
-        """Runner stores pipeline_config."""
-        from unittest.mock import MagicMock
-
-        from langbot.pkg.provider.runners.difysvapi import DifyServiceAPIRunner
-
-        mock_app = MagicMock()
-        pipeline_config = {
-            'ai': {
-                'dify-service-api': {
-                    'app-type': 'chat',
-                    'api-key': 'test-key',
-                    'base-url': 'https://api.dify.ai',
-                }
-            },
-            'output': {'misc': {}}
-        }
-
-        runner = DifyServiceAPIRunner(mock_app, pipeline_config)
-
-        assert runner.pipeline_config == pipeline_config
-        assert runner.ap == mock_app
@@ -1,242 +0,0 @@
-from __future__ import annotations
-
-import json
-from types import SimpleNamespace
-from unittest.mock import AsyncMock, Mock
-
-import pytest
-
-import langbot_plugin.api.entities.builtin.pipeline.query as pipeline_query
-import langbot_plugin.api.entities.builtin.provider.message as provider_message
-import langbot_plugin.api.entities.builtin.provider.session as provider_session
-
-from langbot.pkg.provider.runners.localagent import LocalAgentRunner
-
-
-class RecordingProvider:
-    def __init__(self):
-        self.requests: list[dict] = []
-
-    async def invoke_llm(self, query, model, messages, funcs, extra_args=None, remove_think=None):
-        self.requests.append(
-            {
-                'messages': list(messages),
-                'funcs': list(funcs),
-                'remove_think': remove_think,
-            }
-        )
-
-        if len(self.requests) == 1:
-            return provider_message.Message(
-                role='assistant',
-                content='Let me calculate that exactly.',
-                tool_calls=[
-                    provider_message.ToolCall(
-                        id='call-1',
-                        type='function',
-                        function=provider_message.FunctionCall(
-                            name='exec',
-                            arguments=json.dumps(
-                                {'command': ("python - <<'PY'\nnums = [1, 2, 3, 4]\nprint(sum(nums) / len(nums))\nPY")}
-                            ),
-                        ),
-                    )
-                ],
-            )
-
-        tool_result = json.loads(messages[-1].content)
-        return provider_message.Message(
-            role='assistant',
-            content=f'The average is {tool_result["stdout"]}.',
-        )
-
-
-class RecordingStreamProvider:
-    def __init__(self):
-        self.stream_requests: list[dict] = []
-
-    def invoke_llm_stream(self, query, model, messages, funcs, extra_args=None, remove_think=None):
-        self.stream_requests.append(
-            {
-                'messages': list(messages),
-                'funcs': list(funcs),
-                'remove_think': remove_think,
-            }
-        )
-
-        async def _stream():
-            if len(self.stream_requests) == 1:
-                yield provider_message.MessageChunk(
-                    role='assistant',
-                    tool_calls=[
-                        provider_message.ToolCall(
-                            id='call-1',
-                            type='function',
-                            function=provider_message.FunctionCall(
-                                name='exec',
-                                arguments=json.dumps({'command': "python -c 'print(1)'"}),
-                            ),
-                        )
-                    ],
-                    is_final=True,
-                )
-                return
-
-            yield provider_message.MessageChunk(
-                role='assistant',
-                content='Tool execution failed.',
-                is_final=True,
-            )
-
-        return _stream()
-
-
-def make_query() -> pipeline_query.Query:
-    adapter = AsyncMock()
-    adapter.is_stream_output_supported = AsyncMock(return_value=False)
-
-    return pipeline_query.Query.model_construct(
-        query_id='avg-query',
-        launcher_type=provider_session.LauncherTypes.PERSON,
-        launcher_id=12345,
-        sender_id=12345,
-        message_chain=[],
-        message_event=None,
-        adapter=adapter,
-        pipeline_uuid='pipeline-uuid',
-        bot_uuid='bot-uuid',
-        pipeline_config={
-            'ai': {
-                'runner': {'runner': 'local-agent'},
-                'local-agent': {'model': {'primary': 'test-model-uuid', 'fallbacks': []}, 'prompt': 'test-prompt'},
-            },
-            'output': {'misc': {'remove-think': False}},
-        },
-        prompt=SimpleNamespace(messages=[]),
-        messages=[],
-        user_message=provider_message.Message(
-            role='user',
-            content='Please calculate the average of 1, 2, 3, and 4.',
-        ),
-        use_funcs=[SimpleNamespace(name='exec')],
-        use_llm_model_uuid='test-model-uuid',
-        variables={},
-    )
-
-
-@pytest.mark.asyncio
-async def test_localagent_uses_exec_for_exact_calculation():
-    provider = RecordingProvider()
-    model = SimpleNamespace(
-        provider=provider,
-        model_entity=SimpleNamespace(
-            uuid='test-model-uuid',
-            name='test-model',
-            abilities=['func_call'],
-            extra_args={},
-        ),
-    )
-
-    tool_manager = SimpleNamespace(
-        execute_func_call=AsyncMock(
-            return_value={
-                'session_id': 'avg-query',
-                'backend': 'podman',
-                'status': 'completed',
-                'ok': True,
-                'exit_code': 0,
-                'stdout': '2.5',
-                'stderr': '',
-                'duration_ms': 18,
-            }
-        )
-    )
-
-    app = SimpleNamespace(
-        logger=Mock(),
-        model_mgr=SimpleNamespace(get_model_by_uuid=AsyncMock(return_value=model)),
-        tool_mgr=tool_manager,
-        rag_mgr=SimpleNamespace(),
-        box_service=SimpleNamespace(
-            get_system_guidance=Mock(
-                return_value=(
-                    'When the exec tool is available, use it for exact calculations, statistics, '
-                    'structured data parsing, and code execution instead of estimating mentally. '
-                    'Unless the user explicitly asks for the script, code, or implementation details, '
-                    'do not include the generated script in the final answer. '
-                    'A default workspace is mounted at /workspace for file tasks.'
-                )
-            ),
-        ),
-        skill_mgr=SimpleNamespace(
-            get_skills_for_pipeline=AsyncMock(return_value=[]),
-            detect_skill_activation=AsyncMock(return_value=None),
-            build_activation_prompt=Mock(return_value=None),
-        ),
-    )
-
-    runner = LocalAgentRunner(app, pipeline_config={})
-    query = make_query()
-
-    results = [message async for message in runner.run(query)]
-
-    assert [message.role for message in results] == ['assistant', 'tool', 'assistant']
-    assert results[-1].content == 'The average is 2.5.'
-
-    tool_manager.execute_func_call.assert_awaited_once()
-    tool_name, tool_parameters = tool_manager.execute_func_call.await_args.args[:2]
-    assert tool_name == 'exec'
-    assert 'print(sum(nums) / len(nums))' in tool_parameters['command']
-
-    first_request = provider.requests[0]
-    assert any(
-        message.role == 'system'
-        and 'exec' in str(message.content)
-        and 'exact calculations' in str(message.content)
-        and 'Unless the user explicitly asks for the script' in str(message.content)
-        and '/workspace' in str(message.content)
-        for message in first_request['messages']
-    )
-    assert [tool.name for tool in first_request['funcs']] == ['exec']
-
-
-@pytest.mark.asyncio
-async def test_localagent_streaming_tool_error_yields_message_chunks():
-    provider = RecordingStreamProvider()
-    model = SimpleNamespace(
-        provider=provider,
-        model_entity=SimpleNamespace(
-            uuid='test-model-uuid',
-            name='test-model',
-            abilities=['func_call'],
-            extra_args={},
-        ),
-    )
-
-    adapter = AsyncMock()
-    adapter.is_stream_output_supported = AsyncMock(return_value=True)
-
-    query = make_query()
-    query.adapter = adapter
-
-    app = SimpleNamespace(
-        logger=Mock(),
-        model_mgr=SimpleNamespace(get_model_by_uuid=AsyncMock(return_value=model)),
-        tool_mgr=SimpleNamespace(execute_func_call=AsyncMock(side_effect=RuntimeError('boom'))),
-        rag_mgr=SimpleNamespace(),
-        box_service=SimpleNamespace(
-            get_system_guidance=Mock(return_value='sandbox guidance'),
-        ),
-        skill_mgr=SimpleNamespace(
-            get_skills_for_pipeline=AsyncMock(return_value=[]),
-            detect_skill_activation=AsyncMock(return_value=None),
-            build_activation_prompt=Mock(return_value=None),
-        ),
-    )
-
-    runner = LocalAgentRunner(app, pipeline_config={})
-
-    results = [message async for message in runner.run(query)]
-
-    assert all(isinstance(message, provider_message.MessageChunk) for message in results)
-    assert any(message.role == 'tool' and message.content == 'err: boom' for message in results)
@@ -21,7 +21,6 @@ from langbot.pkg.provider.modelmgr.modelmgr import ModelManager
 from langbot.pkg.provider.modelmgr.requesters.chatcmpl import OpenAIChatCompletions
 from langbot.pkg.provider.modelmgr.requesters.modelscopechatcmpl import ModelScopeChatCompletions
 from langbot.pkg.provider.modelmgr.token import TokenManager
-from langbot.pkg.provider.runners.localagent import LocalAgentRunner


 DEFAULT_RUNNER_ID = 'plugin:langbot/local-agent/default'
@@ -43,8 +42,8 @@ class FakeAgentRunnerRegistry:
            ],
            capabilities={'tool_calling': True, 'knowledge_retrieval': True, 'multimodal_input': True},
            permissions={
-                'models': ['list', 'invoke', 'stream'],
-                'tools': ['list', 'detail', 'call'],
+                'models': ['invoke', 'stream'],
+                'tools': ['detail', 'call'],
                'knowledge_bases': ['list', 'retrieve'],
            },
        )
@@ -320,8 +319,3 @@ async def test_updated_llm_model_is_immediately_usable_by_local_agent_pipeline()
    processed_query = result.new_query

    assert processed_query.use_llm_model_uuid == model_uuid
-
-    runner = SimpleNamespace(ap=ap, pipeline_config=pipeline_config)
-    candidates = await LocalAgentRunner._get_model_candidates(runner, processed_query)
-
-    assert [model.model_entity.uuid for model in candidates] == [model_uuid]