feat(agent-runner): add persistent state APIs

2026-06-09 15:26:03 +00:00 · 2026-05-23 21:45:11 +08:00
parent cefd99e416
commit 24993ac700
12 changed files with 2407 additions and 62 deletions
--- a/src/langbot/pkg/agent/runner/context_builder.py
+++ b/src/langbot/pkg/agent/runner/context_builder.py
@@ -13,6 +13,7 @@ from .descriptor import AgentRunnerDescriptor
 from .config_migration import ConfigMigration
 from .context_packager import AgentContextPackager
 from .state_store import get_state_store
+from .persistent_state_store import get_persistent_state_store
 from . import events as runner_events
 from .host_models import AgentEventEnvelope, AgentBinding
 from .pipeline_compat_adapter import PipelineCompatAdapter
@@ -259,11 +260,13 @@ class AgentRunContextBuilder:

        # Build context access (no history inlined by default for Protocol v1)
        # Populate with actual values from stores
-        context_access = await self._build_context_access(event, descriptor)
+        context_access = await self._build_context_access(event, descriptor, binding)

-        # Build state snapshot from event context
-        state_store = get_state_store()
-        state: AgentRunState = state_store.build_snapshot_from_event(event, binding, descriptor)
+        # Build state snapshot from persistent state store (event-first Protocol v1)
+        persistent_state_store = get_persistent_state_store(
+            self.ap.persistence_mgr.get_db_engine()
+        )
+        state: AgentRunState = await persistent_state_store.build_snapshot_from_event(event, binding, descriptor)

        # Build runtime context
        runtime: AgentRuntimeContext = {
@@ -420,6 +423,7 @@ class AgentRunContextBuilder:
        }

        # Build context access (for legacy, minimal API availability)
+        # Legacy Query-based mode does NOT have persistent state API
        context_access = {
            'conversation_id': conversation.get('conversation_id') if conversation else None,
            'thread_id': None,
@@ -441,7 +445,7 @@ class AgentRunContextBuilder:
                'event_page': False,
                'artifact_metadata': False,
                'artifact_read': False,
-                'state': True,
+                'state': False,  # Legacy Query mode does not have persistent state API
                'storage': True,
            },
        }
@@ -869,12 +873,14 @@ class AgentRunContextBuilder:
        self,
        event: AgentEventEnvelope,
        descriptor: AgentRunnerDescriptor,
+        binding: AgentBinding | None = None,
    ) -> dict[str, typing.Any]:
        """Build ContextAccess with actual values from stores.

        Args:
            event: Event envelope
            descriptor: Runner descriptor
+            binding: Agent binding (required for state_policy in event-first mode)

        Returns:
            ContextAccess dict
@@ -895,6 +901,14 @@ class AgentRunContextBuilder:
        artifact_metadata_enabled = 'metadata' in artifact_permissions
        artifact_read_enabled = 'read' in artifact_permissions

+        # Determine state API availability based on binding state_policy (event-first mode)
+        # For legacy Query-based mode, state is NOT available (no persistent state API)
+        state_enabled = False
+        if binding is not None:
+            state_policy = binding.state_policy
+            if state_policy.enable_state and state_policy.state_scopes:
+                state_enabled = True
+
        # Get latest cursor and has_history_before if conversation exists
        latest_cursor = None
        has_history_before = False
@@ -931,7 +945,7 @@ class AgentRunContextBuilder:
                'event_page': event_page_enabled,
                'artifact_metadata': artifact_metadata_enabled,
                'artifact_read': artifact_read_enabled,
-                'state': True,
+                'state': state_enabled,
                'storage': True,
            },
        }
--- a/src/langbot/pkg/agent/runner/orchestrator.py
+++ b/src/langbot/pkg/agent/runner/orchestrator.py
@@ -17,6 +17,7 @@ from .context_builder import AgentRunContextBuilder, AgentRunContextPayload
 from .resource_builder import AgentResourceBuilder
 from .result_normalizer import AgentResultNormalizer
 from .state_store import get_state_store, RunnerScopedStateStore
+from .persistent_state_store import get_persistent_state_store, PersistentStateStore
 from .session_registry import get_session_registry, AgentRunSessionRegistry
 from .config_migration import ConfigMigration
 from .host_models import AgentEventEnvelope, AgentBinding
@@ -63,6 +64,7 @@ class AgentRunOrchestrator:
    # Cached singleton references (set in __init__)
    _session_registry: AgentRunSessionRegistry
    _state_store: RunnerScopedStateStore
+    _persistent_state_store: PersistentStateStore | None

    def __init__(
        self,
@@ -77,6 +79,7 @@ class AgentRunOrchestrator:
        # Cache singleton references to avoid per-request getter calls
        self._session_registry = get_session_registry()
        self._state_store = get_state_store()
+        self._persistent_state_store = None  # Lazy init on first use

    async def run(
        self,
@@ -122,6 +125,9 @@ class AgentRunOrchestrator:
            resources=resources,
        )

+        # Build state context for State API handlers
+        state_context = self._build_state_context(event, binding, descriptor)
+
        # Register session for proxy action permission validation
        run_id = context['run_id']
        await self._session_registry.register(
@@ -132,6 +138,11 @@ class AgentRunOrchestrator:
            resources=resources,
            permissions=descriptor.permissions or {},
            conversation_id=event.conversation_id,
+            state_policy={
+                'enable_state': binding.state_policy.enable_state,
+                'state_scopes': list(binding.state_policy.state_scopes),
+            },
+            state_context=state_context,
        )

        # Write incoming event to EventLog
@@ -170,7 +181,7 @@ class AgentRunOrchestrator:

                # Handle state.updated first - consume before normalizer
                if result_dict.get('type') == 'state.updated':
-                    self._handle_state_updated_event(result_dict, event, binding, descriptor)
+                    await self._handle_state_updated_event(result_dict, event, binding, descriptor)
                    # Pass to normalizer for logging, but don't yield to pipeline
                    await self.result_normalizer.normalize(result_dict, descriptor)
                    continue
@@ -555,7 +566,7 @@ class AgentRunOrchestrator:
                f'artifact.created failed to register artifact: {e}',
            )

-    def _handle_state_updated_event(
+    async def _handle_state_updated_event(
        self,
        result_dict: dict[str, typing.Any],
        event: AgentEventEnvelope,
@@ -564,6 +575,8 @@ class AgentRunOrchestrator:
    ) -> None:
        """Handle state.updated result in event-first mode.

+        Persists state to database via PersistentStateStore.
+
        Args:
            result_dict: Raw result dict with type='state.updated'
            event: Event envelope
@@ -585,8 +598,14 @@ class AgentRunOrchestrator:
            )
            return

-        # Apply update to state store using event context
-        success = self._state_store.apply_update_from_event(
+        # Lazy init persistent state store
+        if self._persistent_state_store is None:
+            self._persistent_state_store = get_persistent_state_store(
+                self.ap.persistence_mgr.get_db_engine()
+            )
+
+        # Apply update to persistent state store
+        success, error = await self._persistent_state_store.apply_update_from_event(
            event=event,
            binding=binding,
            descriptor=descriptor,
@@ -600,7 +619,79 @@ class AgentRunOrchestrator:
            self.ap.logger.debug(
                f'Runner {descriptor.id} state.updated (event mode): scope={scope}, key={key}'
            )
-        # Invalid scope or missing identity is already logged by apply_update_from_event
+        elif error:
+            self.ap.logger.warning(
+                f'Runner {descriptor.id} state.updated rejected: {error}'
+            )
+
+    def _build_state_context(
+        self,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+    ) -> dict[str, typing.Any]:
+        """Assemble the per-run context consumed by State API handlers.
+
+        Args:
+            event: Event envelope supplying conversation/actor/subject identity
+            binding: Agent binding supplying the binding identity
+            descriptor: Runner descriptor supplying the runner id
+
+        Returns:
+            Dict with 'scope_keys' (scope name -> scope_key, only for scopes
+            whose identity is present on the event; 'runner' is always set),
+            'binding_identity', and the bot/workspace/conversation/thread/
+            actor/subject fields copied from the event.
+        """
+        # Prefer the explicit binding id; fall back to "<scope_type>:<scope_id>".
+        binding_identity = binding.binding_id
+        if not binding_identity:
+            binding_scope = binding.scope
+            has_scope = binding_scope.scope_type and binding_scope.scope_id
+            binding_identity = (
+                f"{binding_scope.scope_type}:{binding_scope.scope_id}" if has_scope else "unknown_binding"
+            )
+
+        actor = event.actor
+        subject = event.subject
+
+        # Every scope key starts with runner id + binding identity for isolation.
+        prefix = [descriptor.id, binding_identity]
+        scope_keys: dict[str, str] = {}
+
+        # Conversation scope, narrowed further by thread when one is present.
+        if event.conversation_id:
+            conversation_parts = [*prefix, event.conversation_id]
+            if event.thread_id:
+                conversation_parts.append(event.thread_id)
+            scope_keys['conversation'] = 'conversation:' + ':'.join(conversation_parts)
+
+        # Actor scope; a missing actor_type is written as 'user'.
+        if actor and actor.actor_id:
+            actor_parts = [*prefix, actor.actor_type or 'user', actor.actor_id]
+            scope_keys['actor'] = 'actor:' + ':'.join(actor_parts)
+
+        # Subject scope; a missing subject_type is written as 'unknown'.
+        if subject and subject.subject_id:
+            subject_parts = [*prefix, subject.subject_type or 'unknown', subject.subject_id]
+            scope_keys['subject'] = 'subject:' + ':'.join(subject_parts)
+
+        # Runner scope needs no event identity, so it is always present.
+        scope_keys['runner'] = 'runner:' + ':'.join(prefix)
+
+        state_context: dict[str, typing.Any] = {
+            'scope_keys': scope_keys,
+            'binding_identity': binding_identity,
+            'bot_id': event.bot_id,
+            'workspace_id': event.workspace_id,
+            'conversation_id': event.conversation_id,
+            'thread_id': event.thread_id,
+            'actor_type': actor.actor_type if actor else None,
+            'actor_id': actor.actor_id if actor else None,
+            'subject_type': subject.subject_type if subject else None,
+            'subject_id': subject.subject_id if subject else None,
+        }
+        return state_context

    async def _write_event_log(
        self,
--- a/src/langbot/pkg/agent/runner/persistent_state_store.py
+++ b/src/langbot/pkg/agent/runner/persistent_state_store.py
@@ -0,0 +1,522 @@
+"""Persistent state store for AgentRunner protocol state.
+
+This module provides a database-backed state store for event-first Protocol v1,
+while preserving in-memory state store for legacy Query-based flow.
+"""
+from __future__ import annotations
+
+import asyncio
+import json
+import threading
+import typing
+from datetime import datetime, timezone
+
+import sqlalchemy
+from sqlalchemy import select, delete, update
+from sqlalchemy.ext.asyncio import AsyncEngine
+
+from langbot_plugin.api.entities.builtin.pipeline import query as pipeline_query
+
+from .descriptor import AgentRunnerDescriptor
+from .host_models import AgentEventEnvelope, AgentBinding
+from ...entity.persistence.agent_runner_state import AgentRunnerState
+
+
+# Scope names known to the store; apply_update_from_event rejects any other scope.
+VALID_STATE_SCOPES = ('conversation', 'actor', 'subject', 'runner')
+
+# Legacy state key names that apply_update_from_event rewrites before storing.
+LEGACY_KEY_MAPPING = {
+    'conversation_id': 'external.conversation_id',
+}
+
+# Upper bound, in UTF-8 encoded bytes, for one serialized state value (256 KiB).
+MAX_VALUE_JSON_BYTES = 256 * 1024
+
+
+class PersistentStateStore:
+    """Database-backed state store for AgentRunner protocol state.
+
+    IMPORTANT: This is HOST-OWNED protocol state, NOT plugin instance state.
+
+    This store provides:
+    1. Persistent storage across runs via database
+    2. Scope isolation by runner_id + binding_identity + scope
+    3. Policy enforcement (enable_state, state_scopes)
+    4. JSON value validation and size limits
+
+    Used by:
+    - Event-first Protocol v1 (async methods)
+    - State API handlers (get/set/delete/list)
+    """
+
+    def __init__(self, db_engine: AsyncEngine) -> None:
+        self._db_engine = db_engine  # async engine every query in this store runs on
+
+    # ========== Scope Key Building (shared with in-memory store) ==========
+
+    def _get_binding_identity(self, binding: AgentBinding) -> str:
+        """Return binding_id, else "<scope_type>:<scope_id>", else "unknown_binding"."""
+        identity = binding.binding_id
+        if not identity:
+            binding_scope = binding.scope
+            both_present = binding_scope.scope_type and binding_scope.scope_id
+            identity = f"{binding_scope.scope_type}:{binding_scope.scope_id}" if both_present else "unknown_binding"
+        return identity
+
+    def _make_conversation_scope_key(
+        self,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+    ) -> str | None:
+        """Return the conversation scope key, or None without a conversation_id.
+
+        Format: conversation:<runner_id>:<binding_identity>:<conversation_id>,
+        with ":<thread_id>" appended when the event carries a thread_id.
+        """
+        conversation_id = event.conversation_id
+        if not conversation_id:
+            return None
+        segments = ['conversation', descriptor.id, self._get_binding_identity(binding), conversation_id]
+        thread_id = event.thread_id
+        if thread_id:
+            segments.append(thread_id)
+        return ':'.join(segments)
+
+    def _make_actor_scope_key(
+        self,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+    ) -> str | None:
+        """Return the actor scope key, or None when the event has no actor id.
+
+        Format: actor:<runner_id>:<binding_identity>:<actor_type>:<actor_id>,
+        where a missing actor_type is written as 'user'.
+        """
+        actor = event.actor
+        if not (actor and actor.actor_id):
+            return None
+
+        actor_type = actor.actor_type or 'user'
+        segments = ['actor', descriptor.id, self._get_binding_identity(binding), actor_type, actor.actor_id]
+        return ':'.join(segments)
+
+    def _make_subject_scope_key(
+        self,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+    ) -> str | None:
+        """Return the subject scope key, or None when the event has no subject id.
+
+        Format: subject:<runner_id>:<binding_identity>:<subject_type>:<subject_id>,
+        where a missing subject_type is written as 'unknown'.
+        """
+        subject = event.subject
+        if not (subject and subject.subject_id):
+            return None
+
+        subject_type = subject.subject_type or 'unknown'
+        segments = ['subject', descriptor.id, self._get_binding_identity(binding), subject_type, subject.subject_id]
+        return ':'.join(segments)
+
+    def _make_runner_scope_key(
+        self,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+    ) -> str:
+        """Return the runner scope key; it needs no identity from the event.
+
+        Format: runner:<runner_id>:<binding_identity>. The event argument is
+        not read by this method.
+        """
+        segments = ('runner', descriptor.id, self._get_binding_identity(binding))
+        return ':'.join(segments)
+
+    def _get_scope_key(
+        self,
+        scope: str,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+    ) -> str | None:
+        """Build the scope key for scope; None for unknown scopes or missing identity."""
+        builders = {
+            'conversation': self._make_conversation_scope_key,
+            'actor': self._make_actor_scope_key,
+            'subject': self._make_subject_scope_key,
+            'runner': self._make_runner_scope_key,
+        }
+        make_key = builders.get(scope)
+        # Unknown scope names yield None rather than raising.
+        return make_key(event, binding, descriptor) if make_key is not None else None
+
+    def _check_scope_enabled(self, scope: str, binding: AgentBinding) -> bool:
+        """Return True only if state is enabled and scope is in the allowed scopes."""
+        policy = binding.state_policy
+        if policy.enable_state:
+            return scope in policy.state_scopes
+        return False
+
+    def _validate_json_value(
+        self,
+        value: typing.Any,
+        logger: typing.Any = None,
+    ) -> tuple[str | None, str | None]:
+        """Serialize value to JSON and enforce MAX_VALUE_JSON_BYTES (logger is unused).
+
+        Returns:
+            (json_string, None) on success, or (None, error_message) when the value
+            cannot be serialized, cannot be UTF-8 encoded, or exceeds the size limit.
+        """
+        try:
+            json_str = json.dumps(value, ensure_ascii=False)
+            # Lone surrogates survive dumps() but fail to encode (UnicodeEncodeError is a ValueError).
+            json_bytes = len(json_str.encode('utf-8'))
+        except (TypeError, ValueError, RecursionError) as e:
+            return None, f'Value is not JSON-serializable: {e}'
+
+        if json_bytes > MAX_VALUE_JSON_BYTES:
+            return None, f'Value size {json_bytes} bytes exceeds limit {MAX_VALUE_JSON_BYTES} bytes'
+
+        return json_str, None
+
+    # ========== Async DB Operations ==========
+
+    async def build_snapshot_from_event(
+        self,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+    ) -> dict[str, dict[str, typing.Any]]:
+        """Load the stored state of every enabled scope for this event.
+
+        Args:
+            event: Event envelope identifying conversation, actor and subject
+            binding: Agent binding whose state_policy gates which scopes are read
+            descriptor: Runner descriptor supplying the runner id
+
+        Returns:
+            Dict with one entry per scope in VALID_STATE_SCOPES. Disabled scopes
+            and scopes without identity on the event stay empty. Rows whose
+            value_json is empty or not valid JSON are skipped.
+
+        When the conversation scope is enabled and the event has a
+        conversation_id, 'external.conversation_id' defaults to that id unless
+        a stored value already exists.
+        """
+        snapshot: dict[str, dict[str, typing.Any]] = {
+            scope_name: {} for scope_name in VALID_STATE_SCOPES
+        }
+
+        # With state disabled nothing is read from the database.
+        if not binding.state_policy.enable_state:
+            return snapshot
+
+        async with self._db_engine.connect() as conn:
+            for scope_name in VALID_STATE_SCOPES:
+                # Skip scopes the policy does not allow or the event cannot identify.
+                if not self._check_scope_enabled(scope_name, binding):
+                    continue
+                scope_key = self._get_scope_key(scope_name, event, binding, descriptor)
+                if not scope_key:
+                    continue
+
+                # One query per scope: every (state_key, value_json) pair under scope_key.
+                stmt = select(AgentRunnerState.state_key, AgentRunnerState.value_json).where(
+                    AgentRunnerState.scope_key == scope_key
+                )
+                scope_values = snapshot[scope_name]
+                for row in (await conn.execute(stmt)).fetchall():
+                    raw_json = row.value_json
+                    if not raw_json:
+                        continue
+                    try:
+                        scope_values[row.state_key] = json.loads(raw_json)
+                    except json.JSONDecodeError:
+                        continue  # Skip invalid JSON
+
+        # Seed external.conversation_id from the event when nothing is stored for it.
+        if self._check_scope_enabled('conversation', binding) and event.conversation_id:
+            conversation_state = snapshot['conversation']
+            conversation_state.setdefault('external.conversation_id', event.conversation_id)
+
+        return snapshot
+
+    async def apply_update_from_event(
+        self,
+        event: AgentEventEnvelope,
+        binding: AgentBinding,
+        descriptor: AgentRunnerDescriptor,
+        scope: str,
+        key: str,
+        value: typing.Any,
+        logger: typing.Any = None,
+    ) -> tuple[bool, str | None]:
+        """Validate and persist one state update derived from event context.
+
+        Args:
+            event: Event envelope supplying scope identity and row metadata
+            binding: Agent binding whose state_policy gates the update
+            descriptor: Runner descriptor supplying the runner id
+            scope: Target scope; must be in VALID_STATE_SCOPES and enabled
+            key: State key; names in LEGACY_KEY_MAPPING are rewritten first
+            value: JSON-serializable value to store
+            logger: Forwarded to _validate_json_value
+
+        Returns:
+            (True, None) when the row was written, else (False, reason).
+        """
+        # Policy gates, most general first, so the caller gets the precise reason.
+        if not binding.state_policy.enable_state:
+            return False, 'State is disabled by binding policy'
+        if scope not in VALID_STATE_SCOPES:
+            return False, f'Invalid scope: {scope}'
+        if not self._check_scope_enabled(scope, binding):
+            return False, f'Scope "{scope}" not enabled by binding policy'
+
+        # Map legacy key names
+        key = LEGACY_KEY_MAPPING.get(key, key)
+
+        # A scope without identity on this event (e.g. no actor id) cannot be keyed.
+        scope_key = self._get_scope_key(scope, event, binding, descriptor)
+        if not scope_key:
+            return False, f'Missing identity for scope "{scope}"'
+
+        value_json, error = self._validate_json_value(value, logger)
+        if error:
+            return False, error
+
+        binding_identity = self._get_binding_identity(binding)
+        # Naive UTC, as utcnow() returned, without the API deprecated since Python 3.12.
+        now = datetime.now(timezone.utc).replace(tzinfo=None)
+
+        # NOTE(review): select-then-write is not atomic; two concurrent first writes
+        # of one key can both take the insert branch - confirm a unique constraint
+        # on (scope_key, state_key) exists.
+        async with self._db_engine.begin() as conn:
+            result = await conn.execute(
+                select(AgentRunnerState.id)
+                .where(AgentRunnerState.scope_key == scope_key)
+                .where(AgentRunnerState.state_key == key)
+            )
+            existing = result.first()
+            if existing:
+                # Existing row: only the value and updated_at change.
+                await conn.execute(
+                    update(AgentRunnerState)
+                    .where(AgentRunnerState.id == existing.id)
+                    .values(
+                        value_json=value_json,
+                        updated_at=now,
+                    )
+                )
+            else:
+                # First write of this key: store identity metadata from the event.
+                await conn.execute(
+                    sqlalchemy.insert(AgentRunnerState).values(
+                        runner_id=descriptor.id,
+                        binding_identity=binding_identity,
+                        scope=scope,
+                        scope_key=scope_key,
+                        state_key=key,
+                        value_json=value_json,
+                        bot_id=event.bot_id,
+                        workspace_id=event.workspace_id,
+                        conversation_id=event.conversation_id,
+                        thread_id=event.thread_id,
+                        actor_type=event.actor.actor_type if event.actor else None,
+                        actor_id=event.actor.actor_id if event.actor else None,
+                        subject_type=event.subject.subject_type if event.subject else None,
+                        subject_id=event.subject.subject_id if event.subject else None,
+                        created_at=now,
+                        updated_at=now,
+                    )
+                )
+
+        return True, None
+
+    async def state_get(
+        self,
+        scope_key: str,
+        state_key: str,
+    ) -> typing.Any:
+        """Fetch and decode the value stored under (scope_key, state_key).
+
+        Returns None when no row matches, the stored JSON text is empty, or it
+        cannot be decoded. Used by State API handlers.
+        """
+        lookup = select(AgentRunnerState.value_json).where(
+            AgentRunnerState.scope_key == scope_key,
+            AgentRunnerState.state_key == state_key,
+        )
+        async with self._db_engine.connect() as conn:
+            row = (await conn.execute(lookup)).first()
+        raw_json = row.value_json if row else None
+        if not raw_json:
+            return None
+        try:
+            decoded = json.loads(raw_json)
+        except json.JSONDecodeError:
+            decoded = None
+        return decoded
+
+    async def state_set(
+        self,
+        scope_key: str,
+        state_key: str,
+        value: typing.Any,
+        runner_id: str,
+        binding_identity: str,
+        scope: str,
+        context: dict[str, typing.Any] | None = None,
+        logger: typing.Any = None,
+    ) -> tuple[bool, str | None]:
+        """Create or overwrite the value stored under (scope_key, state_key).
+
+        Used by State API handlers. runner_id, binding_identity, scope and the
+        optional context fields (bot_id, conversation_id, ...) are written only when
+        a new row is inserted. Returns (True, None) or (False, error_message).
+        """
+        value_json, error = self._validate_json_value(value, logger)
+        if error:
+            return False, error
+
+        context = context or {}
+        # Naive UTC, as utcnow() returned, without the API deprecated since Python 3.12.
+        now = datetime.now(timezone.utc).replace(tzinfo=None)
+
+        # NOTE(review): select-then-write is not atomic; confirm a unique constraint
+        # on (scope_key, state_key) guards against concurrent first writes.
+        async with self._db_engine.begin() as conn:
+            result = await conn.execute(
+                select(AgentRunnerState.id)
+                .where(AgentRunnerState.scope_key == scope_key)
+                .where(AgentRunnerState.state_key == state_key)
+            )
+            existing = result.first()
+            if existing:
+                # Existing row: only the value and updated_at change.
+                await conn.execute(
+                    update(AgentRunnerState)
+                    .where(AgentRunnerState.id == existing.id)
+                    .values(
+                        value_json=value_json,
+                        updated_at=now,
+                    )
+                )
+            else:
+                # First write of this key: store the caller-supplied identity metadata.
+                await conn.execute(
+                    sqlalchemy.insert(AgentRunnerState).values(
+                        runner_id=runner_id,
+                        binding_identity=binding_identity,
+                        scope=scope,
+                        scope_key=scope_key,
+                        state_key=state_key,
+                        value_json=value_json,
+                        bot_id=context.get('bot_id'),
+                        workspace_id=context.get('workspace_id'),
+                        conversation_id=context.get('conversation_id'),
+                        thread_id=context.get('thread_id'),
+                        actor_type=context.get('actor_type'),
+                        actor_id=context.get('actor_id'),
+                        subject_type=context.get('subject_type'),
+                        subject_id=context.get('subject_id'),
+                        created_at=now,
+                        updated_at=now,
+                    )
+                )
+
+        return True, None
+
+    async def state_delete(
+        self,
+        scope_key: str,
+        state_key: str,
+    ) -> bool:
+        """Delete the value stored under (scope_key, state_key).
+
+        Returns True if a row was deleted, False if none matched.
+        """
+        async with self._db_engine.begin() as conn:
+            result = await conn.execute(
+                delete(AgentRunnerState)
+                .where(AgentRunnerState.scope_key == scope_key)
+                .where(AgentRunnerState.state_key == state_key)
+            )
+            # rowcount instead of DELETE ... RETURNING: RETURNING is not available on
+            # every backend (e.g. MySQL, SQLite before 3.35).
+            return result.rowcount > 0
+
+    async def state_list(
+        self,
+        scope_key: str,
+        prefix: str | None = None,
+        limit: int = 100,
+    ) -> tuple[list[str], bool]:
+        """List state keys in a scope, in ascending key order.
+
+        Args:
+            scope_key: Scope whose keys are listed
+            prefix: If given, only keys starting with this literal text are returned
+            limit: Maximum number of keys; clamped to the range 0..100
+
+        Returns:
+            Tuple of (keys, has_more).
+        """
+        # Clamp both ends: a negative limit would reach SQL LIMIT and the slice below.
+        limit = max(0, min(limit, 100))
+
+        query = (
+            select(AgentRunnerState.state_key)
+            .where(AgentRunnerState.scope_key == scope_key)
+            .order_by(AgentRunnerState.state_key)
+            .limit(limit + 1)  # Fetch one extra to check has_more
+        )
+        if prefix:
+            # autoescape keeps '%' and '_' in prefix from acting as LIKE wildcards.
+            query = query.where(AgentRunnerState.state_key.startswith(prefix, autoescape=True))
+
+        async with self._db_engine.connect() as conn:
+            rows = (await conn.execute(query)).fetchall()
+        keys = [row.state_key for row in rows[:limit]]
+        return keys, len(rows) > limit
+
+    async def clear_all(self) -> None:
+        """Delete every row of the state table (for testing)."""
+        async with self._db_engine.begin() as txn:
+            await txn.execute(delete(AgentRunnerState))
+
+
+# Module-level store instance; created by the first get_persistent_state_store() call
+_persistent_state_store: PersistentStateStore | None = None
+_persistent_state_store_lock = threading.Lock()  # held while the instance is created or reset
+
+
+def get_persistent_state_store(db_engine: AsyncEngine | None = None) -> PersistentStateStore:
+    """Return the shared PersistentStateStore, creating it on first use.
+
+    Args:
+        db_engine: Engine used to create the store; ignored once it exists
+
+    Raises:
+        RuntimeError: If the store does not exist yet and db_engine is None
+    """
+    global _persistent_state_store
+    with _persistent_state_store_lock:
+        if _persistent_state_store is None and db_engine is None:
+            raise RuntimeError("db_engine required for first call to get_persistent_state_store")
+        if _persistent_state_store is None:
+            _persistent_state_store = PersistentStateStore(db_engine)
+        return _persistent_state_store
+
+
+def reset_persistent_state_store() -> None:
+    """Drop the shared store so the next getter call builds a new one (for testing)."""
+    global _persistent_state_store
+    with _persistent_state_store_lock:
+        _persistent_state_store = None
--- a/src/langbot/pkg/agent/runner/session_registry.py
+++ b/src/langbot/pkg/agent/runner/session_registry.py
@@ -28,6 +28,8 @@ class AgentRunSession(typing.TypedDict):
        conversation_id: Conversation ID for history/event access
        resources: Authorized resources for this run (from AgentResources)
        permissions: Runner permissions from descriptor (artifacts, history, events, etc.)
+        state_policy: State policy from binding (enable_state, state_scopes)
+        state_context: Context for state API (scope_keys, binding_identity, etc.)
        status: Session status tracking
        _authorized_ids: Pre-computed authorized resource IDs for O(1) lookup
    """
@@ -38,6 +40,8 @@ class AgentRunSession(typing.TypedDict):
    conversation_id: str | None
    resources: AgentResources
    permissions: dict[str, list[str]]
+    state_policy: dict[str, typing.Any]  # {enable_state: bool, state_scopes: list}
+    state_context: dict[str, typing.Any]  # {scope_keys: dict, binding_identity: str, ...}
    status: AgentRunSessionStatus
    _authorized_ids: dict[str, set[str]]  # Pre-computed sets for O(1) lookup

@@ -70,6 +74,8 @@ class AgentRunSessionRegistry:
        resources: AgentResources,
        conversation_id: str | None = None,
        permissions: dict[str, list[str]] | None = None,
+        state_policy: dict[str, typing.Any] | None = None,
+        state_context: dict[str, typing.Any] | None = None,
    ) -> None:
        """Register a new agent run session.

@@ -81,12 +87,21 @@ class AgentRunSessionRegistry:
            resources: Authorized resources for this run
            conversation_id: Conversation ID for history/event access
            permissions: Runner permissions from descriptor (artifacts, history, events, etc.)
+            state_policy: State policy from binding (enable_state, state_scopes)
+            state_context: Context for state API (scope_keys, binding_identity, etc.)
        """
        now = int(time.time())

        # Normalize permissions to empty dict if None
        permissions = permissions or {}

+        # Normalize state_policy to defaults if None
+        if state_policy is None:
+            state_policy = {'enable_state': True, 'state_scopes': ['conversation', 'actor']}
+
+        # Normalize state_context to empty dict if None
+        state_context = state_context or {}
+
        # Pre-compute authorized resource IDs for O(1) lookup
        authorized_ids: dict[str, set[str]] = {
            'model': {m.get('model_id') for m in resources.get('models', [])},
@@ -95,14 +110,18 @@ class AgentRunSessionRegistry:
            'file': {f.get('file_id') for f in resources.get('files', [])},
        }

+        # NOTE: state_policy and state_context are stored at session top-level,
+        # NOT in resources. Resources should only contain resource authorization info.
        session: AgentRunSession = {
            'run_id': run_id,
            'runner_id': runner_id,
            'query_id': query_id,
            'plugin_identity': plugin_identity,
            'conversation_id': conversation_id,
-            'resources': resources,
+            'resources': resources,  # Original AgentResources, no state metadata mixed in
            'permissions': permissions,
+            'state_policy': state_policy,
+            'state_context': state_context,
            'status': {
                'started_at': now,
                'last_activity_at': now,