diff --git a/app/.env.example b/app/.env.example
index 91a3052..55c8a0e 100644
--- a/app/.env.example
+++ b/app/.env.example
@@ -14,6 +14,11 @@ JWT_SECRET_KEY=please-set-at-least-32-bytes-secret-key
 # TOKEN_HASH_SECRET=please-set-at-least-32-bytes-and-different-from-jwt-secret
 ACCESS_TOKEN_EXPIRE_MINUTES=4320
 REFRESH_TOKEN_EXPIRE_DAYS=7
+# Auth risk-control defaults (can be overridden per environment)
+MAX_FAILED_LOGIN_ATTEMPTS=8
+ACCOUNT_LOCK_MINUTES=5
+REGISTER_RATE_LIMIT=12
+LOGIN_RATE_LIMIT=30
 
 REDIS_URL=redis://localhost:6379/0
 # RabbitMQ is optional in this stage, kept for future publisher swap.
@@ -60,10 +65,11 @@ AGENT_COMPACT_THRESHOLD=0.75
 AGENT_USER_DAILY_LIMIT=50
 AGENT_USER_CONCURRENT_LIMIT=2
 AGENT_STAGING_TTL_SEC=86400
-AGENT_SSE_ENABLED=false
+AGENT_SSE_ENABLED=true
+AGENT_LLM_PROVIDER=anthropic
 AGENT_LLM_MODEL=claude-sonnet-4-6
-# Configure provider compatibility only via base URL + API key token.
-# Example (DeepSeek Anthropic-compatible endpoint): https://api.deepseek.com/anthropic
+AGENT_LLM_PLAN_MAX_TOKENS=8192
+# For Anthropic-compatible providers, e.g. DeepSeek: https://api.deepseek.com/anthropic
 # AGENT_LLM_BASE_URL=
 # AGENT_LLM_API_KEY=
 AGENT_MCP_ENDPOINTS=[]
diff --git a/app/src/fileflash/agents/harness/__init__.py b/app/src/fileflash/agents/harness/__init__.py
index 87e106a..acdcb08 100644
--- a/app/src/fileflash/agents/harness/__init__.py
+++ b/app/src/fileflash/agents/harness/__init__.py
@@ -6,6 +6,7 @@
 from .policy import PolicyDecision, PolicyGuard
 from .prompt import PromptBuildRequest, PromptBuilder
 from .router import ToolCall, ToolRouter
+from .tool_registry import REGISTRY, ToolContext, ToolRegistry, ToolSpec
 
 __all__ = [
     "AgentEvent",
@@ -20,6 +21,10 @@
     "PolicyGuard",
     "PromptBuildRequest",
     "PromptBuilder",
+    "REGISTRY",
     "ToolCall",
+    "ToolContext",
+    "ToolRegistry",
     "ToolRouter",
+    "ToolSpec",
 ]
diff --git a/app/src/fileflash/agents/harness/ask.py b/app/src/fileflash/agents/harness/ask.py
new file mode 100644
index 0000000..258f4ac
--- /dev/null
+++ b/app/src/fileflash/agents/harness/ask.py
@@ -0,0 +1,128 @@
+from __future__ import annotations
+
+import asyncio
+import contextlib
+from datetime import UTC, datetime
+from typing import Any
+
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ...repositories import AgentInboxMessageRepository
+from .event_bus import AgentEventBus, AgentEventEnvelope, AgentEventStream
+
+
+class AskTimedOut(Exception):  # raised by AskProtocol.ask when no reply arrives within the timeout
+    def __init__(self, *, ask_id: int) -> None:
+        super().__init__(f"Ask {ask_id} timed out")
+        self.ask_id = ask_id  # id of the ask (inbox message) that timed out
+
+
+class AskProtocol:
+    """Ask the user a question for one job and wait for the reply event on the bus."""
+
+    def __init__(self, *, db: AsyncSession, event_bus: AgentEventBus, job_id: int) -> None:
+        self._db = db
+        self._bus = event_bus
+        self._job_id = job_id
+        self._repo = AgentInboxMessageRepository(db)
+        # Pending asks keyed by inbox message id; ``_listen`` resolves them.
+        self._waiters: dict[int, asyncio.Future[Any]] = {}
+        self._sub_ctx = None
+        self._sub_stream: AgentEventStream | None = None
+        self._sub_task: asyncio.Task[None] | None = None
+
+    async def start(self) -> None:
+        """Subscribe to the job's events and start the background listener task."""
+        ctx = self._bus.subscribe(job_id=self._job_id)
+        self._sub_stream = await ctx.__aenter__()
+        # Keep the context only once entered, so ``aclose`` never exits an unentered one.
+        self._sub_ctx = ctx
+        self._sub_task = asyncio.create_task(self._listen())
+
+    async def aclose(self) -> None:
+        """Stop the listener, leave the subscription, and cancel pending asks."""
+        task, ctx = self._sub_task, self._sub_ctx
+        self._sub_task = self._sub_ctx = None
+        try:
+            if task is not None:
+                task.cancel()
+                with contextlib.suppress(asyncio.CancelledError):
+                    await task
+            if ctx is not None:
+                await ctx.__aexit__(None, None, None)
+        finally:
+            # Always release waiters, even if tearing down the subscription failed.
+            for future in self._waiters.values():
+                if not future.done():
+                    future.cancel()
+
+    async def ask(self, *, prompt: str, schema: dict[str, Any], timeout_sec: float) -> Any:
+        """Persist an ask, publish ``agent.ask``, and return the value of the reply.
+
+        Raises ``AskTimedOut`` when no reply arrives within ``timeout_sec`` seconds.
+        """
+        msg = await self._repo.create_ask(
+            job_id=self._job_id,
+            payload={"prompt": prompt, "schema": schema, "timeoutSec": timeout_sec},
+        )
+        await self._db.commit()
+
+        ask_id = int(msg.inbox_message_id)
+        future: asyncio.Future[Any] = asyncio.get_running_loop().create_future()
+        # Register before publishing so a fast reply cannot be missed.
+        self._waiters[ask_id] = future
+        event = AgentEventEnvelope(
+            job_id=self._job_id,
+            event_type="agent.ask",
+            payload={
+                "messageId": str(ask_id),
+                "prompt": prompt,
+                "schema": schema,
+                "timeoutSec": timeout_sec,
+            },
+            emitted_at=datetime.now(UTC),
+        )
+        try:
+            # Publish inside the ``try`` so a failed publish does not leak the waiter.
+            await self._bus.publish(event)
+            try:
+                value = await asyncio.wait_for(future, timeout=timeout_sec)
+            except TimeoutError as exc:
+                await self._repo.mark_timed_out(inbox_message_id=ask_id, answered_at=datetime.now(UTC))
+                await self._db.commit()
+                raise AskTimedOut(ask_id=ask_id) from exc
+        finally:
+            self._waiters.pop(ask_id, None)
+
+        await self._repo.mark_answered(inbox_message_id=ask_id, answered_at=datetime.now(UTC))
+        await self._db.commit()
+        return value
+
+    async def _listen(self) -> None:
+        """Resolve pending asks from ``agent.inbox.reply`` events until cancelled."""
+        assert self._sub_stream is not None
+        while True:
+            try:
+                envelope = await self._sub_stream.next(timeout=None)
+            except asyncio.CancelledError:
+                raise
+            except Exception:
+                # Best effort: keep listening, but back off so a broken stream cannot spin.
+                await asyncio.sleep(0.1)
+                continue
+            if envelope.event_type != "agent.inbox.reply":
+                continue
+            reply_to = envelope.payload.get("replyTo")
+            if reply_to is None:
+                continue
+            try:
+                ask_id = int(reply_to)
+            except (TypeError, ValueError):
+                continue
+            future = self._waiters.get(ask_id)
+            if future is None or future.done():
+                continue
+            future.set_result(envelope.payload.get("value"))
+
+
+__all__ = ["AskProtocol", "AskTimedOut"]
diff --git a/app/src/fileflash/agents/harness/event_bus.py b/app/src/fileflash/agents/harness/event_bus.py
new file mode 100644
index 0000000..05c73d0
--- /dev/null
+++ b/app/src/fileflash/agents/harness/event_bus.py
@@ -0,0 +1,194 @@
+from __future__ import annotations
+
+import asyncio
+import contextlib
+import json
+import logging
+from collections.abc import AsyncIterator
+from contextlib import AbstractAsyncContextManager
+from dataclasses import asdict, dataclass
+from datetime import datetime
+from typing import Any, Protocol
+
+from fastapi.encoders import jsonable_encoder
+from redis.asyncio import Redis
+
+from ...core.settings import Settings, get_settings
+
+logger = logging.getLogger(__name__)
+
+
+@dataclass(slots=True)
+class AgentEventEnvelope:
+    """One agent event for a job, serializable to and from compact JSON."""
+
+    job_id: int
+    event_type: str
+    payload: dict[str, Any]
+    emitted_at: datetime
+    event_id: str | None = None
+
+    def to_json(self) -> str:
+        # Compact separators; non-ASCII text is emitted as-is rather than escaped.
+        return json.dumps(jsonable_encoder(asdict(self)), ensure_ascii=False, separators=(",", ":"))
+
+    @classmethod
+    def from_json(cls, raw: str) -> AgentEventEnvelope:
+        """Rebuild an envelope from ``to_json`` output; a missing payload becomes ``{}``."""
+        decoded = json.loads(raw)
+        job_id, event_type = int(decoded["job_id"]), str(decoded["event_type"])
+        payload = dict(decoded.get("payload") or {})
+        emitted_at = datetime.fromisoformat(decoded["emitted_at"])
+        return cls(job_id, event_type, payload, emitted_at, decoded.get("event_id"))
+
+
+class AgentEventStream(Protocol):  # structural interface for one subscription's event stream
+    async def next(self, *, timeout: float | None = None) -> AgentEventEnvelope: ...
+    async def aclose(self) -> None: ...
+
+
+class AgentEventBus(Protocol):
+    """Structural interface for publishing job events and subscribing to one job's stream."""
+
+    async def publish(self, envelope: AgentEventEnvelope) -> None: ...
+
+    def subscribe(self, *, job_id: int) -> AbstractAsyncContextManager[AgentEventStream]:
+        """Return an async context manager that yields the job's event stream."""
+        ...
+
+
+@dataclass(slots=True)
+class _InMemoryStream:
+    """Event stream backed by a single subscriber's ``asyncio.Queue``."""
+
+    queue: asyncio.Queue[AgentEventEnvelope]
+
+    async def next(self, *, timeout: float | None = None) -> AgentEventEnvelope:
+        pending = self.queue.get()
+        return await (pending if timeout is None else asyncio.wait_for(pending, timeout=timeout))
+
+    async def aclose(self) -> None: ...  # nothing to release on the stream itself
+
+
+class InMemoryAgentEventBus:
+    """Process-local event bus that fans events out to per-subscriber bounded queues."""
+
+    def __init__(self, *, buffer_size: int = 64) -> None:
+        self._buffer = buffer_size
+        self._subscribers: dict[int, list[asyncio.Queue[AgentEventEnvelope]]] = {}
+
+    async def publish(self, envelope: AgentEventEnvelope) -> None:
+        """Deliver ``envelope`` to each subscriber of its job; full queues drop it with a warning."""
+        for target in tuple(self._subscribers.get(envelope.job_id, ())):  # iterate over a copy
+            if target.full():
+                logger.warning("InMemoryAgentEventBus dropped event: queue full job_id=%s", envelope.job_id)
+            else:
+                await target.put(envelope)
+
+    @contextlib.asynccontextmanager
+    async def subscribe(self, *, job_id: int) -> AsyncIterator[_InMemoryStream]:
+        """Register a fresh queue for ``job_id`` and unregister it again on exit."""
+        queue: asyncio.Queue[AgentEventEnvelope] = asyncio.Queue(maxsize=self._buffer)
+        self._subscribers.setdefault(job_id, []).append(queue)
+        try:
+            yield _InMemoryStream(queue=queue)
+        finally:
+            remaining = self._subscribers.get(job_id)
+            if remaining is not None:
+                remaining.remove(queue)
+                if not remaining:
+                    del self._subscribers[job_id]
+
+
+class RedisAgentEventBus:
+    """Event bus that relays job events over Redis pub/sub, one channel per job."""
+
+    def __init__(self, *, redis: Redis, channel_prefix: str, buffer_size: int = 64) -> None:
+        self._redis = redis
+        self._channel_prefix = channel_prefix
+        self._buffer = buffer_size
+
+    def _channel(self, job_id: int) -> str:
+        return f"{self._channel_prefix}:{job_id}:events"
+
+    async def publish(self, envelope: AgentEventEnvelope) -> None:
+        """Publish the JSON-encoded envelope on its job's channel."""
+        await self._redis.publish(self._channel(envelope.job_id), envelope.to_json())
+
+    @contextlib.asynccontextmanager
+    async def subscribe(self, *, job_id: int) -> AsyncIterator[_RedisStream]:
+        """Subscribe to the job's channel and yield a stream over its messages."""
+        pubsub = self._redis.pubsub()
+        channel = self._channel(job_id)
+        try:
+            await pubsub.subscribe(channel)
+            try:
+                yield _RedisStream(pubsub=pubsub)
+            finally:
+                await pubsub.unsubscribe(channel)
+        finally:
+            # Close even when (un)subscribing fails so the connection is not leaked.
+            await pubsub.aclose()
+
+
+@dataclass(slots=True)
+class _RedisStream:  # event stream over an already-subscribed Redis pub/sub object
+    pubsub: Any
+
+    async def next(self, *, timeout: float | None = None) -> AgentEventEnvelope:
+        """Return the next envelope; raise ``TimeoutError`` if none arrives within ``timeout``."""
+        if timeout is None:
+            async for message in self.pubsub.listen():
+                if (envelope := _envelope_from_redis_message(message)) is not None:
+                    return envelope
+            raise TimeoutError("No event within timeout")
+        deadline = asyncio.get_running_loop().time() + timeout
+        while True:  # a None result may be an ignored (un)subscribe notice, not a timeout
+            remaining = max(deadline - asyncio.get_running_loop().time(), 0.0)
+            message = await self.pubsub.get_message(ignore_subscribe_messages=True, timeout=remaining)
+            if (envelope := _envelope_from_redis_message(message)) is not None:
+                return envelope
+            if remaining <= 0:
+                raise TimeoutError("No event within timeout")
+
+    async def aclose(self) -> None:
+        await self.pubsub.aclose()
+
+
+def _envelope_from_redis_message(message: Any) -> AgentEventEnvelope | None:
+    """Decode a Redis pub/sub message into an envelope.
+
+    Returns None for a missing message or any type other than message/pmessage.
+    """
+    if message is None or message.get("type") not in {"message", "pmessage"}:
+        return None
+    raw = message.get("data")
+    text = raw.decode("utf-8") if isinstance(raw, bytes) else str(raw)
+    return AgentEventEnvelope.from_json(text)
+
+
+def build_agent_event_bus(
+    *,
+    settings: Settings | None = None,
+    redis: Redis | None = None,
+) -> AgentEventBus:
+    """Build the event bus: Redis-backed when a client or URL is available, else in-memory."""
+    cfg = settings or get_settings()
+    buffer_size = cfg.agent_event_bus_buffer_size
+    # An explicitly passed client wins; otherwise connect only if a URL is configured.
+    if redis is None and not cfg.redis_url:
+        return InMemoryAgentEventBus(buffer_size=buffer_size)
+    if redis is None:
+        redis = Redis.from_url(cfg.redis_url, decode_responses=True)
+    prefix = cfg.agent_event_channel_prefix
+    return RedisAgentEventBus(redis=redis, channel_prefix=prefix, buffer_size=buffer_size)
+
+
+__all__ = [
+    "AgentEventBus",
+    "AgentEventEnvelope",
+    "AgentEventStream",
+    "InMemoryAgentEventBus",
+    "RedisAgentEventBus",
+    "build_agent_event_bus",
+]
diff --git a/app/src/fileflash/agents/harness/events.py b/app/src/fileflash/agents/harness/events.py
index 8bf7a94..3fbfbb2 100644
--- a/app/src/fileflash/agents/harness/events.py
+++ b/app/src/fileflash/agents/harness/events.py
@@ -1,15 +1,6 @@
 from __future__ import annotations
 
-from dataclasses import dataclass
-from typing import Any
+from .event_bus import AgentEventBus as EventBus
+from .event_bus import AgentEventEnvelope as AgentEvent
 
-
-@dataclass(slots=True)
-class AgentEvent:
-    event_type: str
-    payload: dict[str, Any]
-
-
-class EventBus:
-    async def publish(self, event: AgentEvent) -> None:
-        raise NotImplementedError("EventBus is scaffolded only in this stage")
+__all__ = ["AgentEvent", "EventBus"]
diff --git a/app/src/fileflash/agents/harness/inbox.py b/app/src/fileflash/agents/harness/inbox.py
new file mode 100644
index 0000000..ac7f45c
--- /dev/null
+++ b/app/src/fileflash/agents/harness/inbox.py
@@ -0,0 +1,76 @@
+from __future__ import annotations
+
+from datetime import UTC, datetime
+from typing import Any
+
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ...models.enums import AgentInboxKind, AgentInboxStatus
+from ...repositories import AgentInboxMessageRepository
+from .event_bus import AgentEventBus, AgentEventEnvelope
+
+_INBOX_EVENT_TYPES: dict[AgentInboxKind, str] = {  # bus event type published per inbox kind
+    AgentInboxKind.REPLY: "agent.inbox.reply",  # the event type AskProtocol._listen filters on
+    AgentInboxKind.CONTROL_PAUSE: "agent.inbox.control",  # all control kinds share one event type
+    AgentInboxKind.CONTROL_RESUME: "agent.inbox.control",
+    AgentInboxKind.CONTROL_APPROVE: "agent.inbox.control",
+    AgentInboxKind.CONTROL_DENY: "agent.inbox.control",
+    AgentInboxKind.CONTROL_SKIP: "agent.inbox.control",
+    AgentInboxKind.CONTROL_CANCEL: "agent.inbox.control",
+}
+
+
+class AgentInbox:
+    """Records user inbox messages for a job and announces them on the event bus."""
+
+    def __init__(self, *, db: AsyncSession, event_bus: AgentEventBus) -> None:
+        self._db = db
+        self._bus = event_bus
+        self._repo = AgentInboxMessageRepository(db)
+
+    async def handle(
+        self,
+        *,
+        job_id: int,
+        kind: AgentInboxKind,
+        payload: dict[str, Any],
+        reply_to_id: int | None = None,
+    ):
+        """Validate, record, and publish one user message; return the recorded message.
+
+        Raises ``KeyError`` for a kind with no event type and ``ValueError`` for a reply
+        whose ask is missing, belongs to another job, or is no longer waiting.
+        """
+        # Resolve the event type first so an unmapped kind fails before anything is recorded.
+        event_type = _INBOX_EVENT_TYPES[kind]
+        if kind == AgentInboxKind.REPLY:
+            if reply_to_id is None:
+                raise ValueError("reply requires reply_to_id")
+            ask = await self._repo.get_ask(inbox_message_id=reply_to_id)
+            if ask is None:
+                raise ValueError(f"ask {reply_to_id} not found")
+            if int(ask.job_id) != job_id:
+                raise ValueError(f"ask {reply_to_id} belongs to a different job")
+            if ask.status != AgentInboxStatus.WAITING:
+                raise ValueError(f"ask {reply_to_id} is not waiting")
+
+        # NOTE(review): the session is not committed here; presumably the caller commits.
+        msg = await self._repo.record_user_message(
+            job_id=job_id, kind=kind, payload=payload, reply_to_id=reply_to_id
+        )
+        envelope_payload: dict[str, Any] = {"kind": kind.value, "messageId": str(msg.inbox_message_id)}
+        if reply_to_id is not None:
+            envelope_payload["replyTo"] = str(reply_to_id)
+        # Forward only the optional fields the sender actually supplied.
+        for key in ("value", "metadata"):
+            if key in payload:
+                envelope_payload[key] = payload[key]
+
+        event = AgentEventEnvelope(
+            job_id=job_id, event_type=event_type, payload=envelope_payload, emitted_at=datetime.now(UTC)
+        )
+        await self._bus.publish(event)
+        return msg
+
+
+__all__ = ["AgentInbox"]
diff --git a/app/src/fileflash/agents/harness/policy.py b/app/src/fileflash/agents/harness/policy.py
index 027af98..730322b 100644
--- a/app/src/fileflash/agents/harness/policy.py
+++ b/app/src/fileflash/agents/harness/policy.py
@@ -3,6 +3,7 @@
 from dataclasses import dataclass, field
 
 from ...schemas.agent import AgentProposedAction
+from .tool_registry import REGISTRY
 
 
 @dataclass(slots=True)
@@ -11,38 +12,18 @@ class PolicyDecision:
     reasons: list[str] = field(default_factory=list)
 
 
-HIGH_RISK_TOOLS = frozenset(
-    {
-        "drive.deleteFile",
-        "drive.deleteFolder",
-        "drive.batchDelete",
-        "recycle.clear",
-        "recycle.permanentDelete",
-    }
-)
-
-WRITE_TOOLS = frozenset(
-    {
-        "drive.createFolder",
-        "drive.moveFile",
-        "drive.moveFolder",
-        "drive.renameFile",
-        "drive.renameFolder",
-        *HIGH_RISK_TOOLS,
-    }
-)
-
-
 def classify_tool_side_effect(tool_name: str) -> str:
-    return "write" if tool_name in WRITE_TOOLS else "read"
+    try:
+        return REGISTRY.get(tool_name).side_effect
+    except KeyError:
+        return "write"  # a tool the registry does not know is classified as a write
 
 
 def classify_tool_risk(tool_name: str) -> str:
-    if tool_name in HIGH_RISK_TOOLS or "delete" in tool_name.lower():
+    try:
+        return REGISTRY.get(tool_name).risk_level
+    except KeyError:  # a tool the registry does not know gets the "high" result below
         return "high"
-    if classify_tool_side_effect(tool_name) == "write":
-        return "medium"
-    return "low"
 
 
 def normalize_action_risk(action: AgentProposedAction) -> AgentProposedAction:
@@ -70,6 +51,13 @@ async def evaluate_tool_call(
         tool_name: str,
         high_risk_confirmed: bool = False,
     ) -> PolicyDecision:
+        try:
+            REGISTRY.get(tool_name)
+        except KeyError:
+            return PolicyDecision(
+                allowed=False,
+                reasons=[f"Unsupported agent tool: {tool_name}"],
+            )
         if classify_tool_risk(tool_name) == "high" and not high_risk_confirmed:
             return PolicyDecision(
                 allowed=False,
diff --git a/app/src/fileflash/agents/harness/router.py b/app/src/fileflash/agents/harness/router.py
index 3c46f39..2b3b639 100644
--- a/app/src/fileflash/agents/harness/router.py
+++ b/app/src/fileflash/agents/harness/router.py
@@ -3,23 +3,12 @@
 from dataclasses import dataclass
 from typing import Any
 
-from sqlalchemy import and_, select
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from ...core.errors import ApiError
-from ...core.mime import resolve_file_mime_type
-from ...models import File, Folder
-from ...models.enums import FileStatus, FolderStatus, FolderType
-from ...schemas.file import (
-    CreateFolderRequest,
-    GetFolderContentsQuery,
-    MoveFileRequest,
-    MoveFolderRequest,
-    RenameFileRequest,
-    RenameFolderRequest,
-)
 from ...services.file import FileService
 from ...services.folder import FolderService
+from .tool_registry import REGISTRY, ToolContext
 
 
 @dataclass(slots=True)
@@ -36,323 +25,23 @@ def __init__(self, *, db: AsyncSession, user_id: int) -> None:
         self.folder_service = FolderService(db=db)
 
     async def dispatch(self, call: ToolCall) -> dict[str, Any]:
-        tool = call.tool_name
-        args = dict(call.arguments or {})
-
-        if tool == "drive.listFolder":
-            folder_id = _first_value(args, "folderId", "parentFolderId") or "root"
-            query = GetFolderContentsQuery(
-                folder_id=str(folder_id),
-                page=int(args.get("page") or 1),
-                per_page=min(200, int(args.get("perPage") or 200)),
-            )
-            if str(folder_id) == "root":
-                result = await self.folder_service.get_root_contents(
-                    user_id=self.user_id,
-                    query=query,
-                )
-            else:
-                result = await self.folder_service.get_folder_contents(
-                    user_id=self.user_id,
-                    query=query,
-                )
-            return result.model_dump(by_alias=True, mode="json")
-
-        if tool == "drive.countFiles":
-            return await self._count_files(args)
-
-        if tool == "drive.createFolder":
-            name = _required_text(args, "name", "folderName")
-            parent_id = _first_value(args, "parentFolderId", "targetParentId", "folderId") or "root"
-            result = await self.folder_service.create_folder(
-                user_id=self.user_id,
-                payload=CreateFolderRequest(folder_name=name, parent_folder_id=str(parent_id)),
-            )
-            data = result.model_dump(by_alias=True, mode="json")
-            data.setdefault("folderId", data.get("id"))
-            return data
-
-        if tool == "drive.moveFile":
-            file_id = _required_text(args, "fileId", "id")
-            target_folder_id = _required_text(args, "targetFolderId", "targetParentId")
-            result = await self.file_service.move_file(
-                user_id=self.user_id,
-                file_id=file_id,
-                payload=MoveFileRequest(
-                    target_folder_id=target_folder_id,
-                    share_handling=str(args.get("shareHandling") or "keep"),
-                ),
-            )
-            return result.model_dump(by_alias=True, mode="json")
-
-        if tool == "drive.moveFolder":
-            folder_id = _required_text(args, "folderId", "id")
-            target_parent_id = _required_text(args, "targetParentId", "targetFolderId")
-            result = await self.folder_service.move_folder(
-                user_id=self.user_id,
-                folder_id=folder_id,
-                payload=MoveFolderRequest(
-                    target_parent_id=target_parent_id,
-                    share_handling=str(args.get("shareHandling") or "keep"),
-                ),
-            )
-            return result.model_dump(by_alias=True, mode="json")
-
-        if tool == "drive.renameFile":
-            file_id = _required_text(args, "fileId", "id")
-            file_name = _required_text(args, "fileName", "name")
-            result = await self.file_service.rename_file(
-                user_id=self.user_id,
-                file_id=file_id,
-                payload=RenameFileRequest(file_name=file_name),
-            )
-            return result.model_dump(by_alias=True, mode="json")
-
-        if tool == "drive.renameFolder":
-            folder_id = _required_text(args, "folderId", "id")
-            folder_name = _required_text(args, "folderName", "name")
-            result = await self.folder_service.rename_folder(
-                user_id=self.user_id,
-                folder_id=folder_id,
-                payload=RenameFolderRequest(folder_name=folder_name),
-            )
-            return result.model_dump(by_alias=True, mode="json")
-
-        if tool == "drive.deleteFile":
-            file_id = _required_text(args, "fileId", "id")
-            result = await self.file_service.delete_file(user_id=self.user_id, file_id=file_id)
-            return result.model_dump(by_alias=True, mode="json")
-
-        if tool == "drive.deleteFolder":
-            folder_id = _required_text(args, "folderId", "id")
-            result = await self.folder_service.delete_folder(
-                user_id=self.user_id,
-                folder_id=folder_id,
-            )
-            return result.model_dump(by_alias=True, mode="json")
-
-        raise ApiError(status_code=400, code=400, message=f"Unsupported agent tool: {tool}")
-
-    async def _count_files(self, args: dict[str, Any]) -> dict[str, Any]:
-        folder_id = str(_first_value(args, "folderId", "parentFolderId") or "root")
-        recursive = _bool_arg(args.get("recursive"), default=True)
-        category = _normalize_category(args.get("category"))
-        search = str(args.get("search") or "").strip().lower()
-        root_folder_id = await _resolve_folder_id(
-            self.db,
+        tool_name = str(call.tool_name or "").strip()
+        try:
+            spec = REGISTRY.get(tool_name)
+        except KeyError as exc:
+            raise ApiError(
+                status_code=400,
+                code=400,
+                message=f"Unsupported agent tool: {tool_name}",
+            ) from exc
+
+        ctx = ToolContext(
+            db=self.db,
             user_id=self.user_id,
-            folder_id=folder_id,
-        )
-        folder_ids = (
-            await _active_descendant_folder_ids(
-                self.db,
-                user_id=self.user_id,
-                root_folder_id=root_folder_id,
-            )
-            if recursive
-            else [root_folder_id]
+            file_service=self.file_service,
+            folder_service=self.folder_service,
         )
-
-        statement = select(
-            File.file_id,
-            File.file_name,
-            File.file_size,
-            File.mime_type,
-            File.file_ext,
-            File.folder_id,
-        ).where(
-            and_(
-                File.owner_id == self.user_id,
-                File.folder_id.in_(folder_ids),
-                File.status == FileStatus.ACTIVE,
-                File.is_latest.is_(True),
-            )
-        )
-        if search:
-            statement = statement.where(File.file_name.ilike(f"%{search}%"))
-        statement = statement.order_by(File.file_name.asc())
-
-        rows = (await self.db.execute(statement)).all()
-        by_mime_type: dict[str, int] = {}
-        sample_items: list[dict[str, Any]] = []
-        total_items = 0
-        for row in rows:
-            file_id, file_name, file_size, mime_type, file_ext, row_folder_id = row
-            resolved_mime = resolve_file_mime_type(
-                mime_type=mime_type,
-                file_ext=file_ext,
-                file_name=file_name,
-            )
-            if category is not None and _category_for_file(
-                mime_type=resolved_mime,
-                file_ext=file_ext,
-                file_name=file_name,
-            ) != category:
-                continue
-
-            total_items += 1
-            by_mime_type[resolved_mime] = by_mime_type.get(resolved_mime, 0) + 1
-            if len(sample_items) < 5:
-                sample_items.append(
-                    {
-                        "id": str(file_id),
-                        "name": str(file_name),
-                        "size": int(file_size or 0),
-                        "mimeType": resolved_mime,
-                        "folderId": str(row_folder_id),
-                    }
-                )
-
-        return {
-            "totalItems": total_items,
-            "category": category,
-            "recursive": recursive,
-            "folderId": str(root_folder_id),
-            "byMimeType": dict(sorted(by_mime_type.items())),
-            "sampleItems": sample_items,
-        }
-
-
-def _first_value(args: dict[str, Any], *keys: str) -> Any:
-    for key in keys:
-        value = args.get(key)
-        if value not in (None, ""):
-            return value
-    return None
-
-
-def _required_text(args: dict[str, Any], *keys: str) -> str:
-    value = _first_value(args, *keys)
-    if value is None:
-        raise ApiError(status_code=400, code=400, message=f"Missing required tool input: {keys[0]}")
-    text = str(value).strip()
-    if not text:
-        raise ApiError(status_code=400, code=400, message=f"Missing required tool input: {keys[0]}")
-    return text
-
-
-def _bool_arg(value: Any, *, default: bool) -> bool:
-    if value is None:
-        return default
-    if isinstance(value, bool):
-        return value
-    text = str(value).strip().lower()
-    if text in {"1", "true", "yes", "y"}:
-        return True
-    if text in {"0", "false", "no", "n"}:
-        return False
-    return default
-
-
-async def _resolve_folder_id(db: AsyncSession, *, user_id: int, folder_id: str) -> int:
-    if not folder_id or folder_id == "root":
-        root_id = await db.scalar(
-            select(Folder.folder_id).where(
-                and_(
-                    Folder.owner_id == user_id,
-                    Folder.parent_folder_id.is_(None),
-                    Folder.folder_type == FolderType.ROOT,
-                    Folder.status == FolderStatus.ACTIVE,
-                )
-            )
-        )
-        if root_id is None:
-            raise ApiError(status_code=404, code=404, message="Root folder not found")
-        return int(root_id)
-    try:
-        parsed = int(folder_id)
-    except ValueError as exc:
-        raise ApiError(status_code=400, code=400, message="Invalid folderId") from exc
-    exists = await db.scalar(
-        select(Folder.folder_id).where(
-            and_(
-                Folder.folder_id == parsed,
-                Folder.owner_id == user_id,
-                Folder.status == FolderStatus.ACTIVE,
-            )
-        )
-    )
-    if exists is None:
-        raise ApiError(status_code=404, code=404, message="Folder not found")
-    return parsed
-
-
-async def _active_descendant_folder_ids(
-    db: AsyncSession,
-    *,
-    user_id: int,
-    root_folder_id: int,
-) -> list[int]:
-    descendants = (
-        select(Folder.folder_id)
-        .where(
-            and_(
-                Folder.folder_id == root_folder_id,
-                Folder.owner_id == user_id,
-                Folder.status == FolderStatus.ACTIVE,
-            )
-        )
-        .cte(name="agent_count_descendants", recursive=True)
-    )
-    descendants = descendants.union_all(
-        select(Folder.folder_id).where(
-            and_(
-                Folder.parent_folder_id == descendants.c.folder_id,
-                Folder.owner_id == user_id,
-                Folder.status == FolderStatus.ACTIVE,
-            )
-        )
-    )
-    folder_ids = list(await db.scalars(select(descendants.c.folder_id)))
-    return [int(folder_id) for folder_id in folder_ids]
-
-
-def _normalize_category(value: Any) -> str | None:
-    text = str(value or "").strip().lower()
-    aliases = {
-        "movies": "video",
-        "movie": "video",
-        "film": "video",
-        "films": "video",
-        "视频": "video",
-        "影片": "video",
-        "电影": "video",
-        "videos": "video",
-        "documents": "document",
-        "docs": "document",
-        "images": "image",
-        "pictures": "image",
-        "archives": "archive",
-        "compressed": "archive",
-    }
-    text = aliases.get(text, text)
-    if text in {"video", "audio", "image", "document", "archive", "other"}:
-        return text
-    return None
-
-
-def _category_for_file(*, mime_type: str, file_ext: str | None, file_name: str | None) -> str:
-    mime = (mime_type or "").lower()
-    ext = _normalized_extension(file_ext) or _filename_extension(file_name)
-    if mime.startswith("video/") or ext in {"mp4", "mov", "avi", "mkv", "webm", "m4v"}:
-        return "video"
-    if mime.startswith("audio/") or ext in {"mp3", "wav", "flac", "m4a", "aac", "ogg"}:
-        return "audio"
-    if mime.startswith("image/") or ext in {"jpg", "jpeg", "png", "gif", "webp", "svg", "bmp"}:
-        return "image"
-    if mime in {"application/pdf"} or ext in {"pdf", "doc", "docx", "xls", "xlsx", "ppt", "pptx", "txt", "md"}:
-        return "document"
-    if ext in {"zip", "rar", "7z", "tar", "gz", "bz2", "xz"}:
-        return "archive"
-    return "other"
-
-
-def _normalized_extension(value: str | None) -> str:
-    return str(value or "").strip().lower().lstrip(".")
+        return await spec.handler(ctx, dict(call.arguments or {}))
 
 
-def _filename_extension(value: str | None) -> str:
-    name = str(value or "").strip().lower()
-    if "." not in name:
-        return ""
-    return name.rsplit(".", 1)[-1]
+__all__ = ["ToolCall", "ToolRouter"]
diff --git a/app/src/fileflash/agents/harness/tool_registry.py b/app/src/fileflash/agents/harness/tool_registry.py
new file mode 100644
index 0000000..c508a86
--- /dev/null
+++ b/app/src/fileflash/agents/harness/tool_registry.py
@@ -0,0 +1,138 @@
+from __future__ import annotations
+
+import re
+from collections.abc import Awaitable, Callable
+from dataclasses import dataclass
+from typing import Any, Literal
+
+from sqlalchemy.ext.asyncio import AsyncSession
+
+ToolSideEffect = Literal["read", "write"]
+ToolRiskLevel = Literal["low", "medium", "high"]
+
+
+@dataclass(slots=True)
+class ToolContext:  # per-call dependencies passed to every ToolHandler as its first argument
+    db: AsyncSession
+    user_id: int
+    file_service: Any  # typed Any; the concrete service class is not visible from this module
+    folder_service: Any  # typed Any; the concrete service class is not visible from this module
+
+
+ToolHandler = Callable[[ToolContext, dict[str, Any]], Awaitable[dict[str, Any]]]
+ToolAnswerFormatter = Callable[[dict[str, Any]], str | None]
+
+
+@dataclass(frozen=True, slots=True)
+class ToolSpec:  # immutable description of one agent tool, including its async handler
+    name: str
+    description: str
+    input_schema: dict[str, Any]
+    side_effect: ToolSideEffect
+    risk_level: ToolRiskLevel
+    requires_confirmation: bool
+    handler: ToolHandler
+    anthropic_name: str | None = None  # provider-facing name; derived from ``name`` when omitted
+    answer_formatter: ToolAnswerFormatter | None = None  # optional callable: output dict -> str | None
+
+    def __post_init__(self) -> None:
+        if self.anthropic_name is None:  # frozen=True blocks plain assignment, hence object.__setattr__
+            object.__setattr__(self, "anthropic_name", _to_provider_tool_name(self.name))
+
+    def to_anthropic_tool(self) -> dict[str, Any]:
+        return {
+            "name": self.anthropic_name,
+            "description": self.description,
+            "input_schema": self.input_schema,
+            "internalName": self.name,  # NOTE(review): extra key, presumably consumed before the API call; verify
+        }
+
+    def to_planner_schema(self) -> dict[str, Any]:  # camelCase view; handler and answer_formatter are left out
+        return {
+            "tool": self.name,
+            "providerTool": self.anthropic_name,
+            "description": self.description,
+            "inputSchema": self.input_schema,
+            "sideEffect": self.side_effect,
+            "riskLevel": self.risk_level,
+            "requiresConfirmation": self.requires_confirmation,
+        }
+
+
+class ToolRegistry:  # in-memory index of ToolSpec objects by internal name and by provider-facing name
+    def __init__(self) -> None:
+        self._by_name: dict[str, ToolSpec] = {}
+        self._by_provider_name: dict[str, ToolSpec] = {}
+
+    def register(self, spec: ToolSpec) -> ToolSpec:  # returns ``spec`` itself after indexing it
+        if spec.name in self._by_name:
+            raise ValueError(f"Agent tool already registered: {spec.name}")
+        provider_name = str(spec.anthropic_name or "")  # None would map to "" (ToolSpec fills it in __post_init__)
+        if provider_name in self._by_provider_name:
+            raise ValueError(f"Agent provider tool already registered: {provider_name}")
+        self._by_name[spec.name] = spec
+        self._by_provider_name[provider_name] = spec
+        return spec
+
+    def get(self, name: str) -> ToolSpec:  # raises KeyError for an unregistered name
+        ensure_builtin_tools_registered()  # lookups first make sure the built-in tools module was imported
+        return self._by_name[name]
+
+    def get_by_provider_name(self, name: str) -> ToolSpec:  # raises KeyError for an unregistered name
+        ensure_builtin_tools_registered()
+        return self._by_provider_name[name]
+
+    def all(self) -> list[ToolSpec]:  # new list, in registration (dict insertion) order
+        ensure_builtin_tools_registered()
+        return list(self._by_name.values())
+
+    def all_names(self) -> tuple[str, ...]:
+        return tuple(spec.name for spec in self.all())
+
+    def unknown_names(self, names: list[str] | tuple[str, ...]) -> list[str]:  # subset of ``names`` not registered
+        ensure_builtin_tools_registered()
+        return [name for name in names if name not in self._by_name]
+
+    def validate_names(self, names: list[str] | tuple[str, ...]) -> tuple[str, ...]:  # ValueError lists unknown names
+        unknown = self.unknown_names(names)
+        if unknown:
+            raise ValueError(f"Unknown agent tools: {', '.join(sorted(unknown))}")
+        return tuple(names)
+
+    def schemas_for(self, names: list[str] | tuple[str, ...]) -> list[dict[str, Any]]:
+        return [self.get(name).to_planner_schema() for name in names]
+
+    def anthropic_tools_for(self, names: list[str] | tuple[str, ...]) -> list[dict[str, Any]]:
+        return [self.get(name).to_anthropic_tool() for name in names]
+
+
+REGISTRY = ToolRegistry()
+_BUILTINS_REGISTERED = False
+
+
+def ensure_builtin_tools_registered() -> None:  # deferred import; presumably avoids a cycle with ..tools (verify)
+    global _BUILTINS_REGISTERED
+    if _BUILTINS_REGISTERED:  # already imported once; nothing to do
+        return
+    from .. import tools as _tools  # noqa: F401
+    _BUILTINS_REGISTERED = True  # set only after the import succeeded, so a failed import is retried next call
+
+
+def _to_provider_tool_name(name: str) -> str:
+    """Convert an internal tool name (``drive.countFiles``) to snake_case ``[a-z0-9_]``, max 64 chars."""
+    value = re.sub(r"(?<!^)(?=[A-Z])", "_", name).lower()  # camelCase -> camel_case
+    value = re.sub(r"[^a-z0-9]+", "_", value)[:64].strip("_")  # one "_" per separator run; 64 = provider limit
+    return value or "tool"
+
+
+__all__ = [
+    "REGISTRY",
+    "ToolAnswerFormatter",
+    "ToolContext",
+    "ToolHandler",
+    "ToolRegistry",
+    "ToolRiskLevel",
+    "ToolSideEffect",
+    "ToolSpec",
+    "ensure_builtin_tools_registered",
+]
diff --git a/app/src/fileflash/agents/runtime/execute_runner.py b/app/src/fileflash/agents/runtime/execute_runner.py
index 499b489..04929c9 100644
--- a/app/src/fileflash/agents/runtime/execute_runner.py
+++ b/app/src/fileflash/agents/runtime/execute_runner.py
@@ -1,5 +1,8 @@
 from __future__ import annotations
 
+import asyncio
+import json
+import logging
 from datetime import UTC, datetime
 from typing import Any
 
@@ -7,27 +10,62 @@
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from ...core.errors import ApiError
+from ...core.settings import Settings, get_settings
 from ...models import BackgroundJob
+from ...models.enums import AgentInboxKind
 from ...repositories import (
     AgentActionLogRepository,
+    AgentInboxMessageRepository,
     AgentPlanRepository,
     AgentWorkSessionRepository,
 )
 from ...schemas.agent import AgentExecutionResult, AgentProposedAction, ExecuteAgentRequest
+from ..harness.ask import AskProtocol
+from ..harness.event_bus import AgentEventBus, AgentEventEnvelope
 from ..harness.policy import PolicyGuard
 from ..harness.router import ToolCall, ToolRouter
+from .llm import AnswerClient, AnthropicPlannerClient
 from .reference_rules import is_symbolic_id_placeholder, parse_step_reference
 
+logger = logging.getLogger(__name__)
+
 
 class AgentJobCanceled(Exception):
     pass
 
 
 class ExecuteRunner:
-    def __init__(self, *, policy_guard: PolicyGuard | None = None) -> None:
+    def __init__(
+        self,
+        *,
+        settings: Settings | None = None,
+        policy_guard: PolicyGuard | None = None,
+        event_bus: AgentEventBus | None = None,
+        answer_client: AnswerClient | None = None,
+    ) -> None:
+        self.settings = settings or get_settings()
         self.policy_guard = policy_guard or PolicyGuard()
+        self.event_bus = event_bus
+        self.answer_client = answer_client or AnthropicPlannerClient(settings=self.settings)
 
     async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionResult:
+        ask: AskProtocol | None = None  # stays None when no event bus is configured
+        if self.event_bus is not None:
+            ask = AskProtocol(db=db, event_bus=self.event_bus, job_id=int(job.job_id))
+            await ask.start()
+        try:
+            return await self._run(db=db, job=job, ask=ask)
+        finally:  # close the ask channel whether _run returned or raised
+            if ask is not None:
+                await ask.aclose()
+
+    async def _run(
+        self,
+        *,
+        db: AsyncSession,
+        job: BackgroundJob,
+        ask: AskProtocol | None,
+    ) -> AgentExecutionResult:
         if job.requested_by is None:
             raise ApiError(status_code=400, code=400, message="Agent job is missing requestedBy")
         request = ExecuteAgentRequest.model_validate(dict(job.payload or {}))
@@ -59,10 +97,23 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionRe
         )
         await db.commit()
 
+        inbox_repo = AgentInboxMessageRepository(db) if self.event_bus is not None else None
+        paused = False
         for action in actions:
             await db.refresh(job)
             if job.cancel_requested_at is not None:
                 raise AgentJobCanceled()
+            if inbox_repo is not None:
+                paused, skip_current = await self._handle_step_boundary_controls(
+                    db=db,
+                    job=job,
+                    inbox_repo=inbox_repo,
+                    action=action,
+                    warnings=warnings,
+                    paused=paused,
+                )
+                if skip_current:
+                    continue
 
             decision = await self.policy_guard.evaluate_tool_call(
                 tool_name=action.tool,
@@ -98,6 +149,13 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionRe
                     error_message=f"{type(exc).__name__}: {exc}"[:2000],
                 )
                 await db.commit()
+                await self._publish_tool(
+                    "tool.failed",
+                    job_id=int(job.job_id),
+                    step=action.step,
+                    tool=action.tool,
+                    payload={"errorMessage": f"{type(exc).__name__}: {exc}"[:2000]},
+                )
                 raise
 
             await action_logs.append_step(
@@ -109,6 +167,14 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionRe
                 started_at=started,
             )
             await db.commit()
+            await self._publish_tool(
+                "tool.started",
+                job_id=int(job.job_id),
+                step=action.step,
+                tool=action.tool,
+                payload={"input": resolved_input},
+                emitted_at=started,
+            )
 
             try:
                 output = await router.dispatch(
@@ -126,6 +192,13 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionRe
                     error_message=f"{type(exc).__name__}: {exc}"[:2000],
                 )
                 await db.commit()
+                await self._publish_tool(
+                    "tool.failed",
+                    job_id=int(job.job_id),
+                    step=action.step,
+                    tool=action.tool,
+                    payload={"errorMessage": f"{type(exc).__name__}: {exc}"[:2000]},
+                )
                 raise
 
             safe_output = jsonable_encoder(output)
@@ -138,6 +211,13 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionRe
                 duration_ms=duration_ms,
             )
             await db.commit()
+            await self._publish_tool(
+                "tool.succeeded",
+                job_id=int(job.job_id),
+                step=action.step,
+                tool=action.tool,
+                payload={"output": safe_output, "durationMs": duration_ms},
+            )
             step_outputs[action.step] = safe_output
             applied += 1
 
@@ -146,7 +226,12 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionRe
             warnings.append(f"{skipped} action(s) were skipped.")
         await work_sessions.close_session(job_id=int(job.job_id), status="closed")
         await db.commit()
-        answer = _build_execution_answer(actions=actions, step_outputs=step_outputs)
+        answer = await _build_execution_answer(
+            task_input=str(getattr(plan, "input_text", "") or ""),
+            actions=actions,
+            step_outputs=step_outputs,
+            answer_client=self.answer_client,
+        )
         return AgentExecutionResult(
             plan_job_id=str(plan_job_id),
             execute_job_id=str(job.job_id),
@@ -158,6 +243,96 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentExecutionRe
             finished_at=datetime.now(UTC),
         )
 
+    async def _handle_step_boundary_controls(
+        self,
+        *,
+        db: AsyncSession,
+        job: BackgroundJob,
+        inbox_repo: AgentInboxMessageRepository,
+        action: AgentProposedAction,
+        warnings: list[str],
+        paused: bool,
+    ) -> tuple[bool, bool]:
+        """Apply pending inbox controls at a step boundary; returns ``(paused, skip_current)``."""
+        while True:
+            skip_current = False
+            pending = await inbox_repo.list_pending_controls(job_id=int(job.job_id))
+            for ctrl in pending:
+                kind = AgentInboxKind(ctrl.kind)
+                # Every control message is consumed exactly once, whatever its kind.
+                await inbox_repo.mark_dropped(inbox_message_id=int(ctrl.inbox_message_id))
+                if kind == AgentInboxKind.CONTROL_CANCEL:
+                    job.cancel_requested_at = datetime.now(UTC)
+                    await db.commit()
+                    raise AgentJobCanceled()
+                if kind == AgentInboxKind.CONTROL_PAUSE:
+                    paused = True
+                    await self._publish_state("agent.paused", job_id=int(job.job_id))
+                elif kind == AgentInboxKind.CONTROL_RESUME:
+                    paused = False
+                    await self._publish_state("agent.resumed", job_id=int(job.job_id))
+                elif kind == AgentInboxKind.CONTROL_SKIP:
+                    warnings.append(f"Step {action.step} skipped by user")
+                    skip_current = True
+            await db.commit()
+            if skip_current:
+                return paused, True
+            if not paused:
+                return paused, False
+            await asyncio.sleep(0.1)  # paused: poll again shortly
+            await db.refresh(job)  # a cancel flagged on the job row must also end a paused job
+            if job.cancel_requested_at is not None:
+                raise AgentJobCanceled()
+
+    async def _publish_state(self, event_type: str, *, job_id: int) -> None:  # no-op when no event bus is set
+        if self.event_bus is None:
+            return
+        try:
+            await self.event_bus.publish(
+                AgentEventEnvelope(
+                    job_id=job_id,
+                    event_type=event_type,
+                    payload={},  # state events carry no payload
+                    emitted_at=datetime.now(UTC),
+                )
+            )
+        except Exception:  # best-effort: a publish failure is logged and does not propagate
+            logger.exception(
+                "Failed to publish state event jobId=%s eventType=%s",
+                job_id,
+                event_type,
+            )
+
+    async def _publish_tool(  # publish one per-step tool event; no-op when no event bus is set
+        self,
+        event_type: str,
+        *,
+        job_id: int,
+        step: int,
+        tool: str,
+        payload: dict[str, Any],
+        emitted_at: datetime | None = None,  # defaults to the current UTC time
+    ) -> None:
+        if self.event_bus is None:
+            return
+        try:
+            await self.event_bus.publish(
+                AgentEventEnvelope(
+                    job_id=job_id,
+                    event_type=event_type,
+                    payload={"step": int(step), "tool": str(tool), **payload},  # caller keys win on collision
+                    emitted_at=emitted_at or datetime.now(UTC),
+                )
+            )
+        except Exception:  # best-effort: a publish failure is logged and does not propagate
+            logger.exception(
+                "Failed to publish tool event jobId=%s eventType=%s step=%s tool=%s",
+                job_id,
+                event_type,
+                step,
+                tool,
+            )
+
 
 def _parse_job_id(raw: str) -> int:
     try:
@@ -226,35 +401,89 @@ def _resolve_references(
     return value
 
 
-def _build_execution_answer(
+async def _build_execution_answer(
     *,
+    task_input: str = "",
     actions: list[AgentProposedAction],
     step_outputs: dict[int, dict[str, Any]],
+    answer_client: AnswerClient,
 ) -> str | None:
-    for action in actions:
-        if action.tool != "drive.countFiles":
-            continue
-        output = step_outputs.get(action.step)
-        if not isinstance(output, dict):
-            continue
-        return _count_files_answer(output)
-
-    if actions and all(action.side_effect == "read" for action in actions):
-        return f"已完成 {len(step_outputs)} 个只读操作。"
-    return None
-
-
-def _count_files_answer(output: dict[str, Any]) -> str:
-    total_items = int(output.get("totalItems") or 0)
-    category = str(output.get("category") or "").strip().lower()
-    if category == "video":
-        return f"你上传了 {total_items} 部电影（按视频文件统计）。"
-    if category == "audio":
-        return f"你上传了 {total_items} 个音频文件。"
-    if category == "image":
-        return f"你上传了 {total_items} 张图片。"
-    if category == "document":
-        return f"你上传了 {total_items} 个文档。"
-    if category == "archive":
-        return f"你上传了 {total_items} 个压缩包。"
-    return f"你上传了 {total_items} 个文件。"
+    if not actions:
+        return None
+    user_prompt = _answer_user_prompt(
+        task_input=task_input,
+        actions=actions,
+        step_outputs=step_outputs,
+    )
+    text = await answer_client.create_answer(
+        system_prompt=_answer_system_prompt(),
+        user_prompt=user_prompt,
+        max_tokens=640,
+        reasoning_effort="low",
+    )
+    answer = _normalize_answer(text)
+    if answer is None:
+        raise ApiError(status_code=502, code=502, message="Agent answer model returned empty response")
+    return answer
+
+
+def _answer_system_prompt() -> str:  # constant system prompt used for the post-execution answer request
+    return (
+        "You are FileFlash execution answer generator. "
+        "Only describe results that are present in tool outputs. "
+        "Do not invent filenames, counts, or paths. "
+        "Keep the response concise and user-facing in the same language as the user input."
+    )
+
+
+def _answer_user_prompt(
+    *,
+    task_input: str,
+    actions: list[AgentProposedAction],
+    step_outputs: dict[int, dict[str, Any]],
+) -> str:
+    """Build the user prompt for the answer model.
+
+    Returns key-sorted JSON holding the task text, per-action records and response guidance.
+    """
+    action_entries: list[dict[str, Any]] = [
+        {
+            "step": entry.step,
+            "tool": entry.tool,
+            "sideEffect": entry.side_effect,
+            "input": entry.input,
+            "output": _compact_output(step_outputs.get(entry.step)),
+        }
+        for entry in sorted(actions, key=lambda item: item.step)
+    ]
+    guidance = {
+        "includeNamesWhenAvailable": True,
+        "mentionTruncationWhenProvided": True,
+        "ifAmbiguous": "state candidate count and ask for clarification",
+    }
+    payload = {"task": task_input, "actions": action_entries, "responseGuidance": guidance}
+    return json.dumps(payload, ensure_ascii=False, sort_keys=True)
+
+
+def _compact_output(value: dict[str, Any] | None) -> dict[str, Any] | None:
+    """Return ``value`` unchanged when small; otherwise drop its bulky list fields and say which."""
+    if not isinstance(value, dict):
+        return None
+    if len(json.dumps(value, ensure_ascii=False, separators=(",", ":"))) <= 12_000:
+        return value
+    # List only the fields actually removed, so the answer model is not told intact fields were cut.
+    dropped = [key for key in ("items", "sampleItems") if key in value]
+    compact = {key: item for key, item in value.items() if key not in dropped}
+    compact["truncated"] = True
+    compact["truncatedFields"] = dropped
+    return compact
+
+
+def _normalize_answer(text: str) -> str | None:
+    """Collapse whitespace runs to single spaces and cap at 1200 chars; ``None`` when empty."""
+    collapsed = " ".join(str(text or "").split())
+    if not collapsed:
+        return None
+    if len(collapsed) <= 1200:
+        return collapsed
+    return collapsed[:1200].rstrip() + "…"
diff --git a/app/src/fileflash/agents/runtime/llm.py b/app/src/fileflash/agents/runtime/llm.py
index 4a268ee..1596728 100644
--- a/app/src/fileflash/agents/runtime/llm.py
+++ b/app/src/fileflash/agents/runtime/llm.py
@@ -1,6 +1,8 @@
 from __future__ import annotations
 
 import json
+import logging
+from collections.abc import Awaitable, Callable
 from typing import Any, Protocol
 
 import anthropic
@@ -9,6 +11,9 @@
 from ...core.errors import ApiError
 from ...core.settings import Settings
 
+ToolExecutor = Callable[[str, dict[str, Any]], Awaitable[dict[str, Any]]]
+logger = logging.getLogger(__name__)
+
 
 class PlannerClient(Protocol):
     async def create_plan(
@@ -18,9 +23,23 @@ async def create_plan(
         user_prompt: str,
         max_tokens: int,
         reasoning_effort: str = "adaptive",
+        tools: list[dict[str, Any]] | None = None,
+        tool_executor: ToolExecutor | None = None,
+        max_tool_roundtrips: int = 4,
     ) -> dict[str, Any]: ...
 
 
+class AnswerClient(Protocol):  # structural interface: any object with this async create_answer qualifies
+    async def create_answer(
+        self,
+        *,
+        system_prompt: str,
+        user_prompt: str,
+        max_tokens: int,
+        reasoning_effort: str = "adaptive",
+    ) -> str: ...
+
+
 class AnthropicPlannerClient:
     def __init__(self, *, settings: Settings, client: AsyncAnthropic | None = None) -> None:
         self.settings = settings
@@ -33,14 +52,94 @@ async def create_plan(
         user_prompt: str,
         max_tokens: int,
         reasoning_effort: str = "adaptive",
+        tools: list[dict[str, Any]] | None = None,
+        tool_executor: ToolExecutor | None = None,
+        max_tool_roundtrips: int = 4,
     ) -> dict[str, Any]:
         api_key = (self.settings.agent_llm_api_key or "").strip()
         if not api_key:
             raise ApiError(status_code=503, code=503, message="Agent LLM API key is not configured")
+        plan_token_cap = _safe_plan_token_cap(self.settings)
+
+        request_kwargs: dict[str, Any] = {
+            "model": self.settings.agent_llm_model,
+            "max_tokens": min(max_tokens, plan_token_cap),
+            "system": system_prompt,
+            "messages": [{"role": "user", "content": user_prompt}],
+            "timeout": 60.0,
+        }
+        tool_name_map = _tool_name_map(tools or [])
+        if tools:
+            request_kwargs["tools"] = _anthropic_tools_payload(tools)
+            request_kwargs["tool_choice"] = {"type": "auto"}
+        request_kwargs.update(_reasoning_params(reasoning_effort))
+
+        try:
+            parsed, usage = await self._request_and_parse_plan(
+                api_key=api_key,
+                request_kwargs=request_kwargs,
+                tool_name_map=tool_name_map,
+                tool_executor=tool_executor,
+                max_tool_roundtrips=max_tool_roundtrips,
+            )
+        except ApiError as first_error:
+            if not _is_retryable_output_error(first_error):
+                raise
+            logger.warning(
+                "Planner LLM retrying attempt=%s reason=%s degraded=%s jsonOnly=%s",
+                2,
+                first_error.message,
+                True,
+                False,
+            )
+            degraded_kwargs = _degraded_plan_request_kwargs(request_kwargs)
+            try:
+                parsed, usage = await self._request_and_parse_plan(
+                    api_key=api_key,
+                    request_kwargs=degraded_kwargs,
+                    tool_name_map=tool_name_map,
+                    tool_executor=tool_executor,
+                    max_tool_roundtrips=max_tool_roundtrips,
+                )
+            except ApiError as second_error:
+                if not _is_retryable_output_error(second_error):
+                    raise
+                logger.warning(
+                    "Planner LLM retrying attempt=%s reason=%s degraded=%s jsonOnly=%s",
+                    3,
+                    second_error.message,
+                    True,
+                    True,
+                )
+                strict_kwargs = _strict_json_retry_kwargs(
+                    degraded_kwargs,
+                    max_tokens_cap=plan_token_cap,
+                )
+                parsed, usage = await self._request_and_parse_plan(
+                    api_key=api_key,
+                    request_kwargs=strict_kwargs,
+                    tool_name_map=tool_name_map,
+                    tool_executor=tool_executor,
+                    max_tool_roundtrips=max_tool_roundtrips,
+                )
+        if isinstance(usage, dict):
+            parsed["_usage"] = usage
+        return parsed
 
+    async def create_answer(
+        self,
+        *,
+        system_prompt: str,
+        user_prompt: str,
+        max_tokens: int,
+        reasoning_effort: str = "adaptive",
+    ) -> str:
+        api_key = (self.settings.agent_llm_api_key or "").strip()
+        if not api_key:
+            raise ApiError(status_code=503, code=503, message="Agent LLM API key is not configured")
         request_kwargs: dict[str, Any] = {
             "model": self.settings.agent_llm_model,
-            "max_tokens": min(max_tokens, 4096),
+            "max_tokens": min(max_tokens, 1024),
             "system": system_prompt,
             "messages": [{"role": "user", "content": user_prompt}],
             "timeout": 60.0,
@@ -48,7 +147,7 @@ async def create_plan(
         request_kwargs.update(_reasoning_params(reasoning_effort))
         message = await self._request_plan(api_key=api_key, request_kwargs=request_kwargs)
         try:
-            parsed, usage = _parse_plan_message(message)
+            return _extract_text(message)
         except ApiError as exc:
             if not _is_retryable_output_error(exc):
                 raise
@@ -56,10 +155,7 @@ async def create_plan(
             degraded_kwargs.pop("thinking", None)
             degraded_kwargs.pop("output_config", None)
             message = await self._request_plan(api_key=api_key, request_kwargs=degraded_kwargs)
-            parsed, usage = _parse_plan_message(message)
-        if isinstance(usage, dict):
-            parsed["_usage"] = usage
-        return parsed
+            return _extract_text(message)
 
     async def _request_plan(self, *, api_key: str, request_kwargs: dict[str, Any]) -> Any:
         try:
@@ -93,6 +189,98 @@ def _get_client(self, api_key: str) -> AsyncAnthropic:
             )
         return self._client
 
+    async def _parse_plan_response(  # parse the reply directly, or hand over to the tool loop
+        self,
+        *,
+        api_key: str,
+        request_kwargs: dict[str, Any],
+        message: Any,
+        tool_name_map: dict[str, str],
+        tool_executor: ToolExecutor | None,
+        max_tool_roundtrips: int,
+    ) -> tuple[dict[str, Any], dict[str, Any] | None]:
+        if tool_executor is None:  # nothing can execute tools: treat the reply as the final plan
+            return _parse_plan_message(message, tool_name_map=tool_name_map)
+        tool_calls = _extract_tool_use_calls(message=message, tool_name_map=tool_name_map)
+        if not tool_calls:  # executor available but no calls were extracted from this reply
+            return _parse_plan_message(message, tool_name_map=tool_name_map)
+        return await self._run_tool_loop(
+            api_key=api_key,
+            request_kwargs=request_kwargs,
+            initial_message=message,
+            tool_name_map=tool_name_map,
+            tool_executor=tool_executor,
+            max_tool_roundtrips=max_tool_roundtrips,
+        )
+
+    async def _request_and_parse_plan(  # one LLM request, then _parse_plan_response on its reply
+        self,
+        *,
+        api_key: str,
+        request_kwargs: dict[str, Any],
+        tool_name_map: dict[str, str],
+        tool_executor: ToolExecutor | None,
+        max_tool_roundtrips: int,
+    ) -> tuple[dict[str, Any], dict[str, Any] | None]:
+        message = await self._request_plan(api_key=api_key, request_kwargs=request_kwargs)
+        return await self._parse_plan_response(
+            api_key=api_key,
+            request_kwargs=request_kwargs,  # reused as the base request if a tool loop is started
+            message=message,
+            tool_name_map=tool_name_map,
+            tool_executor=tool_executor,
+            max_tool_roundtrips=max_tool_roundtrips,
+        )
+
+    async def _run_tool_loop(
+        self,
+        *,
+        api_key: str,
+        request_kwargs: dict[str, Any],
+        initial_message: Any,
+        tool_name_map: dict[str, str],
+        tool_executor: ToolExecutor,
+        max_tool_roundtrips: int,
+    ) -> tuple[dict[str, Any], dict[str, Any] | None]:
+        """Execute requested tools and re-query until the model returns a plan.
+
+        Up to ``max_tool_roundtrips`` (clamped to 1..12) rounds run, and the reply to the last
+        round is still parsed; ApiError(502) is raised only if it requests tools yet again.
+        """
+        max_rounds = max(1, min(int(max_tool_roundtrips or 0), 12))
+        base_messages = request_kwargs.get("messages")
+        if not isinstance(base_messages, list):
+            raise ApiError(status_code=502, code=502, message="Agent LLM returned an invalid response")
+        messages: list[dict[str, Any]] = list(base_messages)
+        usage_total: dict[str, int] = {}
+        current_message = initial_message
+
+        # max_rounds + 1 inspections: the reply produced by the last round must be examined too.
+        for round_index in range(max_rounds + 1):
+            usage_total = _merge_usage_totals(usage_total, _usage_payload(current_message))
+            tool_calls = _extract_tool_use_calls(message=current_message, tool_name_map=tool_name_map)
+            if not tool_calls:
+                parsed, _ = _parse_plan_message(current_message, tool_name_map=tool_name_map)
+                return parsed, usage_total or None
+            if round_index == max_rounds:
+                break  # round budget spent and the model still asks for tools
+
+            assistant_content = _content_block_mappings(current_message)
+            if assistant_content:
+                messages.append({"role": "assistant", "content": assistant_content})
+            tool_results: list[dict[str, Any]] = []
+            for call in tool_calls:
+                content = _tool_result_content(await tool_executor(call["tool"], call["input"]))
+                tool_results.append(
+                    {"type": "tool_result", "tool_use_id": call["id"], "content": content}
+                )
+            messages.append({"role": "user", "content": tool_results})
+            loop_kwargs = dict(request_kwargs)
+            loop_kwargs["messages"] = messages
+            current_message = await self._request_plan(api_key=api_key, request_kwargs=loop_kwargs)
+
+        raise ApiError(status_code=502, code=502, message="Agent LLM exceeded planning tool rounds")
+
 
 def _extract_text(message: Any) -> str:
     chunks = getattr(message, "content", None)
@@ -112,6 +300,69 @@ def _extract_text(message: Any) -> str:
     return text
 
 
+def _content_block_mappings(message: Any) -> list[dict[str, Any]]:  # message.content as a list of dict blocks
+    chunks = getattr(message, "content", None)
+    if isinstance(chunks, str):  # bare-string content becomes a single text block
+        return [{"type": "text", "text": chunks}]
+    if not isinstance(chunks, list):  # missing or unexpected content shape: no blocks
+        return []
+    blocks: list[dict[str, Any]] = []
+    for chunk in chunks:
+        if isinstance(chunk, dict):  # already a mapping: kept as the same object, not copied
+            blocks.append(chunk)
+            continue
+        if hasattr(chunk, "model_dump"):  # presumably pydantic-style SDK block objects; verify
+            dumped = chunk.model_dump()
+            if isinstance(dumped, dict):
+                blocks.append(dumped)
+                continue
+        blocks.append(  # fallback: copy the known block attributes; absent ones become None
+            {
+                "type": getattr(chunk, "type", None),
+                "text": getattr(chunk, "text", None),
+                "name": getattr(chunk, "name", None),
+                "input": getattr(chunk, "input", None),
+                "id": getattr(chunk, "id", None),
+            }
+        )
+    return blocks
+
+
+def _extract_tool_use_payload(  # split a reply into tool_use actions and the joined remaining text
+    message: Any,
+    *,
+    tool_name_map: dict[str, str],
+) -> tuple[list[dict[str, Any]], str | None]:
+    actions: list[dict[str, Any]] = []
+    text_parts: list[str] = []
+    for block in _content_block_mappings(message):
+        block_type = str(block.get("type") or "")
+        if block_type == "tool_use":
+            provider_name = str(block.get("name") or "").strip()
+            action_input = _coerce_mapping(block.get("input"))
+            actions.append(
+                {
+                    "step": len(actions) + 1,  # steps are numbered from 1 in block order
+                    "tool": tool_name_map.get(provider_name, provider_name),  # unmapped names pass through as-is
+                    "input": action_input,
+                }
+            )
+            continue
+        text_parts.extend(_extract_text_parts_from_mapping(block))
+    summary = "\n".join(part for part in text_parts if part).strip()
+    return actions, summary or None  # summary is None when no non-empty text was found
+
+
+def _coerce_mapping(value: Any) -> dict[str, Any]:
+    """Return ``value`` as a dict: itself, its ``model_dump()`` result, or ``{}`` as fallback."""
+    if isinstance(value, dict):
+        return value
+    if not hasattr(value, "model_dump"):
+        return {}
+    dumped = value.model_dump()
+    return dumped if isinstance(dumped, dict) else {}
+
+
 def _extract_text_parts(chunk: Any) -> list[str]:
     if chunk is None:
         return []
@@ -193,6 +444,34 @@ def _usage_payload(message: Any) -> dict[str, Any] | None:
     return payload or None
 
 
+def _merge_usage_totals(base: dict[str, int], extra: dict[str, Any] | None) -> dict[str, int]:
+    """Return a copy of ``base`` with the known token counters of ``extra`` added in."""
+    totals = dict(base)
+    if not isinstance(extra, dict):
+        return totals
+    for name in (
+        "input_tokens",
+        "output_tokens",
+        "cache_creation_input_tokens",
+        "cache_read_input_tokens",
+    ):
+        try:
+            # int(None) raises TypeError, so counters absent from ``extra`` are
+            # skipped the same way as values that cannot be parsed as integers.
+            delta = int(extra.get(name))
+        except (TypeError, ValueError):
+            continue
+        totals[name] = int(totals.get(name) or 0) + delta
+    return totals
+
+
+def _tool_result_content(payload: dict[str, Any]) -> list[dict[str, str]]:
+    """Serialize ``payload`` into one text block, cut to 12,000 characters plus an ellipsis."""
+    limit = 12_000
+    text = json.dumps(payload, ensure_ascii=False)
+    return [{"type": "text", "text": text if len(text) <= limit else text[:limit] + "…"}]
+
+
 def _reasoning_params(reasoning_effort: str) -> dict[str, Any]:
     effort = (reasoning_effort or "adaptive").strip().lower()
     if effort == "adaptive":
@@ -211,13 +490,83 @@ def _response_details(error: anthropic.APIStatusError) -> str:
     return str(text or "")[:800]
 
 
-def _parse_plan_message(message: Any) -> tuple[dict[str, Any], dict[str, Any] | None]:
+def _parse_plan_message(
+    message: Any,
+    *,
+    tool_name_map: dict[str, str] | None = None,
+) -> tuple[dict[str, Any], dict[str, Any] | None]:
+    tool_actions, summary = _extract_tool_use_payload(
+        message,
+        tool_name_map=tool_name_map or {},
+    )
+    usage = _usage_payload(message)
+    if tool_actions:
+        return {
+            "summary": summary or f"Prepared {len(tool_actions)} file action(s).",
+            "proposedActions": tool_actions,
+        }, usage
     text = _extract_text(message)
     parsed = _parse_json_text(text)
-    usage = _usage_payload(message)
     return parsed, usage
 
 
+def _extract_tool_use_calls(
+    message: Any,
+    *,
+    tool_name_map: dict[str, str],
+) -> list[dict[str, Any]]:
+    """Collect the named tool_use blocks of ``message`` as id/tool/input dicts.
+
+    Blocks without an id receive a positional ``tool_use_<n>`` placeholder.
+    """
+    collected: list[dict[str, Any]] = []
+    for mapping in _content_block_mappings(message):
+        raw_name = str(mapping.get("name") or "").strip()
+        if str(mapping.get("type") or "") != "tool_use" or not raw_name:
+            continue
+        call_id = str(mapping.get("id") or "").strip() or f"tool_use_{len(collected) + 1}"
+        collected.append(
+            {
+                "id": call_id,
+                "tool": tool_name_map.get(raw_name, raw_name),
+                "input": _coerce_mapping(mapping.get("input")),
+            }
+        )
+    return collected
+
+
+def _tool_name_map(tools: list[dict[str, Any]]) -> dict[str, str]:
+    """Map provider-facing tool names to internal tool names.
+
+    The internal name is the first truthy value among ``internalName``,
+    ``internal_name`` and ``tool``; the provider name is used when none is set.
+    """
+    resolved: dict[str, str] = {}
+    for entry in tools:
+        exposed = str(entry.get("name") or "").strip()
+        if exposed:
+            aliases = (entry.get(key) for key in ("internalName", "internal_name", "tool"))
+            internal = str(next(filter(None, aliases), exposed)).strip()
+            resolved[exposed] = internal or exposed
+    return resolved
+
+
+def _anthropic_tools_payload(tools: list[dict[str, Any]]) -> list[dict[str, Any]]:
+    """Reduce tool specs to the ``name``/``description``/``input_schema`` keys.
+
+    Entries with a blank name are dropped; a missing schema becomes ``{"type": "object"}``.
+    """
+    return [
+        {
+            "name": name,
+            "description": str(tool.get("description") or ""),
+            "input_schema": dict(tool.get("input_schema") or {"type": "object"}),
+        }
+        for tool in tools
+        if (name := str(tool.get("name") or "").strip())
+    ]
+
+
 def _is_retryable_output_error(error: ApiError) -> bool:
     if error.status_code != 502:
         return False
@@ -229,26 +578,137 @@ def _is_retryable_output_error(error: ApiError) -> bool:
     }
 
 
+def _safe_plan_token_cap(settings: Settings) -> int:
+    """Return the configured plan token cap (at least 1), or 8192 if missing or unparsable."""
+    configured = getattr(settings, "agent_llm_plan_max_tokens", 8192)
+    try:
+        return max(1, int(configured))
+    except (TypeError, ValueError):
+        return 8192
+
+
+def _degraded_plan_request_kwargs(request_kwargs: dict[str, Any]) -> dict[str, Any]:
+    """Return a shallow copy of ``request_kwargs`` without ``thinking`` and ``output_config``."""
+    dropped = ("thinking", "output_config")
+    slimmed = {key: value for key, value in request_kwargs.items() if key not in dropped}
+    return slimmed
+
+
+def _strict_json_retry_kwargs(
+    request_kwargs: dict[str, Any],
+    *,
+    max_tokens_cap: int,
+) -> dict[str, Any]:
+    """Copy ``request_kwargs`` with ``max_tokens`` forced to the cap and a JSON-only nudge."""
+    capped = max(1, int(max_tokens_cap))
+    # The retry messages are derived from the caller's ``messages`` entry.
+    retry_messages = _append_json_only_retry_instruction(request_kwargs.get("messages"))
+    return {**request_kwargs, "max_tokens": capped, "messages": retry_messages}
+
+
+def _append_json_only_retry_instruction(messages: Any) -> list[dict[str, Any]]:
+    """Return shallow copies of ``messages`` with a JSON-only instruction added.
+
+    The instruction is merged into the last user message whose content is a
+    string; if there is none it is appended as a new user message. Non-dict
+    entries are dropped, and a non-list ``messages`` yields only the instruction.
+    """
+    instruction = (
+        "Return ONLY one valid JSON object that matches outputSchema. "
+        "Do not include markdown fences, prose, or extra text."
+    )
+    nudge = {"role": "user", "content": instruction}
+    if not isinstance(messages, list):
+        return [nudge]
+    copies = [dict(entry) for entry in messages if isinstance(entry, dict)]
+    for entry in reversed(copies):
+        body = entry.get("content")
+        # User turns with non-string content (e.g. block lists) are passed over.
+        if entry.get("role") != "user" or not isinstance(body, str):
+            continue
+        trimmed = body.rstrip()
+        entry["content"] = f"{trimmed}\n\n{instruction}" if trimmed else instruction
+        return copies
+    copies.append(nudge)
+    return copies
+
+
 def _parse_json_text(text: str) -> dict[str, Any]:
-    candidate = text.strip()
-    if candidate.startswith("```"):
-        lines = candidate.splitlines()
-        if lines and lines[0].startswith("```"):
-            lines = lines[1:]
-        if lines and lines[-1].startswith("```"):
-            lines = lines[:-1]
-        candidate = "\n".join(lines).strip()
+    candidate = _strip_code_fences(text)
     try:
-        parsed = json.loads(candidate)
-    except json.JSONDecodeError as exc:
+        return _decode_json_object(candidate)
+    except ApiError:
+        raise
+    except json.JSONDecodeError as decode_error:
+        extracted = _extract_balanced_json_object(candidate)
+        if extracted is not None:
+            try:
+                return _decode_json_object(extracted)
+            except ApiError:
+                raise
+            except json.JSONDecodeError:
+                pass
         raise ApiError(
             status_code=502,
             code=502,
             message="Agent LLM did not return valid JSON",
-        ) from exc
+        ) from decode_error
+
+
+def _decode_json_object(candidate: str) -> dict[str, Any]:
+    parsed = json.loads(candidate)
     if not isinstance(parsed, dict):
         raise ApiError(status_code=502, code=502, message="Agent LLM JSON must be an object")
     return parsed
 
 
-__all__ = ["AnthropicPlannerClient", "PlannerClient"]
+def _strip_code_fences(text: str) -> str:
+    """Trim ``text`` and, if it opens with a ``` fence, drop the fence lines around it."""
+    stripped = text.strip()
+    if stripped.startswith("```"):
+        # The first line is the opening fence (possibly with a language tag).
+        body = stripped.splitlines()[1:]
+        if body and body[-1].startswith("```"):
+            body.pop()
+        return "\n".join(body).strip()
+    return stripped
+
+
+def _extract_balanced_json_object(text: str) -> str | None:
+    """Return the first brace-balanced span of ``text`` that parses as JSON.
+
+    Braces inside double-quoted strings are not counted. A balanced span that
+    is not valid JSON (e.g. ``{note}`` in surrounding prose) is skipped and the
+    scan continues after it. Returns ``None`` when no span qualifies.
+    """
+    start, depth = -1, 0
+    in_string = escaped = False
+    for idx, ch in enumerate(text):
+        if start < 0:
+            if ch == "{":
+                start, depth = idx, 1
+        elif in_string:
+            if escaped:
+                escaped = False
+            elif ch == "\\":
+                escaped = True
+            elif ch == '"':
+                in_string = False
+        elif ch == '"':
+            in_string = True
+        elif ch == "{":
+            depth += 1
+        elif ch == "}":
+            depth -= 1
+            if depth == 0:
+                candidate = text[start : idx + 1]
+                try:
+                    json.loads(candidate)
+                except ValueError:
+                    start = -1  # not JSON: keep looking for a later object
+                else:
+                    return candidate
+    return None
+
+
+__all__ = ["AnswerClient", "AnthropicPlannerClient", "PlannerClient", "ToolExecutor"]
diff --git a/app/src/fileflash/agents/runtime/plan_runner.py b/app/src/fileflash/agents/runtime/plan_runner.py
index e3421d0..6caaa75 100644
--- a/app/src/fileflash/agents/runtime/plan_runner.py
+++ b/app/src/fileflash/agents/runtime/plan_runner.py
@@ -1,6 +1,7 @@
 from __future__ import annotations
 
 import hashlib
+import inspect
 import json
 from datetime import UTC, datetime
 from typing import Any
@@ -19,26 +20,19 @@
 from ...schemas.agent import (
     AgentChosenSkill,
     AgentCostEstimate,
+    AgentPlanningEvidence,
     AgentPlanResult,
     AgentProposedAction,
     PlanAgentRequest,
 )
+from ..harness.ask import AskProtocol
+from ..harness.event_bus import AgentEventBus
 from ..harness.policy import classify_tool_side_effect, normalize_action_risk
+from ..harness.router import ToolCall, ToolRouter
+from ..harness.tool_registry import REGISTRY
 from .llm import AnthropicPlannerClient, PlannerClient
 from .reference_rules import is_symbolic_id_placeholder, parse_step_reference
 
-DEFAULT_AGENT_TOOLS = (
-    "drive.listFolder",
-    "drive.countFiles",
-    "drive.createFolder",
-    "drive.moveFile",
-    "drive.moveFolder",
-    "drive.renameFile",
-    "drive.renameFolder",
-    "drive.deleteFile",
-    "drive.deleteFolder",
-)
-
 
 class PlanRunner:
     def __init__(
@@ -46,11 +40,30 @@ def __init__(
         *,
         settings: Settings | None = None,
         planner_client: PlannerClient | None = None,
+        event_bus: AgentEventBus | None = None,
     ) -> None:
         self.settings = settings or get_settings()
         self.planner_client = planner_client or AnthropicPlannerClient(settings=self.settings)
+        self.event_bus = event_bus
 
     async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentPlanResult:
+        ask: AskProtocol | None = None
+        if self.event_bus is not None:
+            ask = AskProtocol(db=db, event_bus=self.event_bus, job_id=int(job.job_id))
+            await ask.start()
+        try:
+            return await self._run(db=db, job=job, ask=ask)
+        finally:
+            if ask is not None:
+                await ask.aclose()
+
+    async def _run(
+        self,
+        *,
+        db: AsyncSession,
+        job: BackgroundJob,
+        ask: AskProtocol | None,
+    ) -> AgentPlanResult:
         if job.requested_by is None:
             raise ApiError(status_code=400, code=400, message="Agent job is missing requestedBy")
 
@@ -64,26 +77,60 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentPlanResult:
         )
         metadata = await _collect_context_metadata(db, user_id=user_id, request=request)
         allowed_tools = _skill_tool_whitelist(skill)
-        try:
-            llm_payload = await self.planner_client.create_plan(
-                system_prompt=_system_prompt(),
-                user_prompt=_user_prompt(
-                    request=request,
-                    skill=skill,
-                    allowed_tools=allowed_tools,
-                    metadata=metadata,
-                ),
-                max_tokens=request.hints.budget_tokens,
-                reasoning_effort=request.hints.reasoning_effort,
-            )
-        except ApiError as exc:
-            if exc.status_code != 502:
-                raise
-            llm_payload = _safe_fallback_payload(
+        allowed_tool_set = set(allowed_tools)
+        planner_router = ToolRouter(db=db, user_id=user_id)
+        tool_call_budget = min(self.settings.agent_job_max_tool_calls, 32)
+        planned_tool_calls = 0
+        planning_evidence: list[AgentPlanningEvidence] = []
+
+        async def _planning_tool_executor(tool_name: str, args: dict[str, Any]) -> dict[str, Any]:
+            nonlocal planned_tool_calls
+            if tool_name not in allowed_tool_set:
+                raise ApiError(
+                    status_code=400,
+                    code=400,
+                    message=f"Planner attempted disallowed tool: {tool_name}",
+                )
+            spec = REGISTRY.get(tool_name)
+            if spec.side_effect != "read":
+                raise ApiError(
+                    status_code=400,
+                    code=400,
+                    message=f"Planner exploratory tool call must be read-only: {tool_name}",
+                )
+            planned_tool_calls += 1
+            if planned_tool_calls > tool_call_budget:
+                raise ApiError(
+                    status_code=400,
+                    code=400,
+                    message="Planner exceeded exploratory tool-call budget",
+                )
+            output = await planner_router.dispatch(ToolCall(tool_name=tool_name, arguments=args))
+            if len(planning_evidence) < 12:
+                planning_evidence.append(
+                    AgentPlanningEvidence(
+                        step=planned_tool_calls,
+                        tool=tool_name,
+                        input=_evidence_mapping(args),
+                        output_preview=_evidence_preview(output),
+                    )
+                )
+            return output
+
+        llm_payload = await self.planner_client.create_plan(
+            system_prompt=_system_prompt(),
+            user_prompt=_user_prompt(
                 request=request,
-                metadata=metadata,
+                skill=skill,
                 allowed_tools=allowed_tools,
-            )
+                metadata=metadata,
+            ),
+            max_tokens=request.hints.budget_tokens,
+            reasoning_effort=request.hints.reasoning_effort,
+            tools=REGISTRY.anthropic_tools_for(allowed_tools),
+            tool_executor=_planning_tool_executor,
+            max_tool_roundtrips=6,
+        )
 
         actions = _normalize_actions(
             llm_payload=llm_payload,
@@ -91,11 +138,19 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentPlanResult:
             max_steps=min(request.hints.max_steps, self.settings.agent_job_max_tool_calls),
         )
         chosen_skill = _chosen_skill(skill)
-        summary = str(
+        llm_summary = str(
             llm_payload.get("summary") or f"Prepared {len(actions)} file action(s)."
         ).strip()
-        if not summary:
-            summary = f"Prepared {len(actions)} file action(s)."
+        if not llm_summary:
+            llm_summary = f"Prepared {len(actions)} file action(s)."
+        summary = llm_summary
+        if _has_write_actions(actions):
+            summary = await _grounded_write_summary(
+                db,
+                user_id=user_id,
+                actions=actions,
+                fallback_summary=llm_summary,
+            )
 
         requires_confirmation = (
             request.execution_policy != "autopilot"
@@ -115,6 +170,7 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentPlanResult:
             summary=summary,
             requires_confirmation=requires_confirmation,
             cost_estimate=cost_estimate,
+            planning_evidence=planning_evidence or None,
         )
         await _upsert_agent_plan(
             db,
@@ -129,6 +185,21 @@ async def run(self, *, db: AsyncSession, job: BackgroundJob) -> AgentPlanResult:
             raise
         return result
 
+    async def _ask(
+        self,
+        *,
+        ask: AskProtocol | None,
+        prompt: str,
+        schema: dict[str, Any],
+    ) -> Any | None:
+        """Relay a question through ``ask``; resolves to ``None`` when ``ask`` is ``None``."""
+        if ask is None:
+            return None
+        # ``timeout_sec`` comes from the ``agent_inbox_ask_timeout_sec`` setting,
+        # coerced to float.
+        wait_sec = float(self.settings.agent_inbox_ask_timeout_sec)
+        return await ask.ask(prompt=prompt, schema=schema, timeout_sec=wait_sec)
+
 
 async def _choose_skill(
     db: AsyncSession,
@@ -193,10 +264,16 @@ def _skill_tool_whitelist(skill: AgentSkill | AgentSkillCatalogEntry | None) ->
         raw = skill.tool_whitelist_json
     if isinstance(raw, list) and raw:
         tools = tuple(str(item) for item in raw if str(item).strip())
-        if "drive.countFiles" not in tools:
-            return (*tools, "drive.countFiles")
+        unknown = REGISTRY.unknown_names(tools)
+        if unknown:
+            raise ApiError(
+                status_code=422,
+                code=422,
+                message="Unknown agent tool in selected skill",
+                data={"unknownTools": sorted(unknown)},
+            )
         return tools
-    return DEFAULT_AGENT_TOOLS
+    return REGISTRY.all_names()
 
 
 def _chosen_skill(skill: AgentSkill | AgentSkillCatalogEntry | None) -> AgentChosenSkill | None:
@@ -368,9 +445,8 @@ def _folder_metadata(row: Folder) -> dict[str, Any]:
 
 def _system_prompt() -> str:
     return (
-        "You are FileFlash Agent Planner. Return only JSON. "
-        "Plan file-management actions or read-only answers using the provided tools and metadata. "
-        "For count/how many questions, prefer drive.countFiles over listing folders. "
+        "You are FileFlash Agent Planner. Build plans from tool-grounded facts, not assumptions. "
+        "If you need facts, first call read-only tools; then output one final JSON object that matches outputSchema. "
         "Do not read or infer file contents. Deletions are high risk and must be explicit. "
         "Cross-step dependencies must use '$stepN.field' references only and never symbolic placeholders "
         "like 'newFolderId'."
@@ -392,6 +468,17 @@ def _user_prompt(
         "skill": _skill_payload(skill),
         "allowedTools": list(allowed_tools),
         "toolSchemas": _tool_schemas(allowed_tools),
+        "toolUseMode": (
+            "Use read-only tools first when facts are missing. "
+            "Write tools must appear only in final proposedActions, not exploratory tool_use steps."
+        ),
+        "plannerDefaults": {
+            "organizeRequest": {
+                "scope": "root recursive unless user constrained the scope",
+                "folderNaming": "reuse existing folders first; create english category folders if missing",
+                "writePlanPolicy": "generate executable write actions by default",
+            }
+        },
         "referenceContract": {
             "syntax": "$stepN.field",
             "rules": [
@@ -449,89 +536,7 @@ def _skill_payload(skill: AgentSkill | AgentSkillCatalogEntry | None) -> dict[st
 
 
 def _tool_schemas(allowed_tools: tuple[str, ...]) -> list[dict[str, Any]]:
-    descriptions = {
-        "drive.listFolder": "List direct folder contents by folderId.",
-        "drive.countFiles": (
-            "Count files under folderId. Supports recursive=true and category values "
-            "video, audio, image, document, archive, other. Use category=video for movie/电影 questions."
-        ),
-        "drive.createFolder": "Create a folder under parentFolderId with name.",
-        "drive.moveFile": "Move fileId into targetFolderId.",
-        "drive.moveFolder": "Move folderId into targetParentId.",
-        "drive.renameFile": "Rename fileId to fileName.",
-        "drive.renameFolder": "Rename folderId to folderName.",
-        "drive.deleteFile": "Soft-delete fileId into recycle bin. High risk.",
-        "drive.deleteFolder": "Soft-delete folderId into recycle bin. High risk.",
-    }
-    return [{"tool": tool, "description": descriptions.get(tool, "")} for tool in allowed_tools]
-
-
-def _safe_fallback_payload(
-    *,
-    request: PlanAgentRequest,
-    metadata: dict[str, Any],
-    allowed_tools: tuple[str, ...],
-) -> dict[str, Any]:
-    fallback_actions: list[dict[str, Any]] = []
-    if "drive.countFiles" in allowed_tools and _looks_like_count_question(request.input):
-        fallback_actions.append(
-            {
-                "step": 1,
-                "tool": "drive.countFiles",
-                "input": {
-                    "folderId": metadata.get("rootFolderId") or request.context.root_folder_id or "root",
-                    "recursive": True,
-                    "category": _fallback_count_category(request.input),
-                },
-                "sideEffect": "read",
-                "riskLevel": "low",
-                "requiresConfirmation": False,
-            }
-        )
-        return {
-            "summary": "Planner fallback mode: generated a safe read-only count plan.",
-            "proposedActions": fallback_actions,
-        }
-    if "drive.listFolder" in allowed_tools:
-        root_folder_id = str(
-            metadata.get("rootFolderId")
-            or request.context.root_folder_id
-            or "root"
-        )
-        fallback_actions.append(
-            {
-                "step": 1,
-                "tool": "drive.listFolder",
-                "input": {"folderId": root_folder_id},
-                "sideEffect": "read",
-                "riskLevel": "low",
-                "requiresConfirmation": False,
-            }
-        )
-    return {
-        "summary": "Planner fallback mode: generated a safe read-only plan.",
-        "proposedActions": fallback_actions,
-    }
-
-
-def _looks_like_count_question(text: str) -> bool:
-    normalized = text.lower()
-    return any(token in normalized for token in ("多少", "几个", "几部", "count", "how many", "number of"))
-
-
-def _fallback_count_category(text: str) -> str | None:
-    normalized = text.lower()
-    if any(token in normalized for token in ("电影", "影片", "视频", "movie", "film", "video")):
-        return "video"
-    if any(token in normalized for token in ("图片", "照片", "image", "photo", "picture")):
-        return "image"
-    if any(token in normalized for token in ("音频", "音乐", "audio", "music")):
-        return "audio"
-    if any(token in normalized for token in ("文档", "document", "doc")):
-        return "document"
-    if any(token in normalized for token in ("压缩", "archive", "zip")):
-        return "archive"
-    return None
+    return REGISTRY.schemas_for(allowed_tools)
 
 
 def _normalize_actions(
@@ -668,6 +673,300 @@ def _validate_action_input_value(
             )
 
 
+def _has_write_actions(actions: list[AgentProposedAction]) -> bool:  # any "write" side effect?
+    return "write" in (action.side_effect for action in actions)
+
+
+async def _grounded_write_summary(
+    db: AsyncSession,
+    *,
+    user_id: int,
+    actions: list[AgentProposedAction],
+    fallback_summary: str,
+) -> str:
+    write_actions = [action for action in actions if action.side_effect == "write"]
+    if not write_actions:
+        return fallback_summary
+    # Build the summary from the planned create/move actions; fallback_summary is used otherwise.
+    created_folder_names: list[str] = []
+    created_folder_by_step: dict[int, str] = {}
+    move_file_actions: list[AgentProposedAction] = []
+    move_folder_actions: list[AgentProposedAction] = []
+    file_ids: set[int] = set()
+    folder_ids: set[int] = set()
+    # NOTE(review): other write tools (e.g. rename/delete) add nothing to the summary - confirm.
+    for action in write_actions:
+        if action.tool == "drive.createFolder":
+            folder_name = str(action.input.get("name") or action.input.get("folderName") or "").strip()
+            if folder_name:
+                created_folder_names.append(folder_name)
+                created_folder_by_step[action.step] = folder_name
+            continue
+        if action.tool == "drive.moveFile":
+            move_file_actions.append(action)
+            file_id = _coerce_positive_int(action.input.get("fileId"))
+            if file_id is not None:
+                file_ids.add(file_id)
+            target_folder_id = action.input.get("targetFolderId")
+            if isinstance(target_folder_id, str):  # non-string targets are not looked up
+                parsed_folder_id = _coerce_positive_int(target_folder_id)
+                if parsed_folder_id is not None:
+                    folder_ids.add(parsed_folder_id)
+            continue
+        if action.tool == "drive.moveFolder":
+            move_folder_actions.append(action)
+            source_folder_id = _coerce_positive_int(action.input.get("folderId"))
+            if source_folder_id is not None:
+                folder_ids.add(source_folder_id)
+            target_parent_id = action.input.get("targetParentId", action.input.get("targetFolderId"))
+            if isinstance(target_parent_id, str):
+                parsed_parent_id = _coerce_positive_int(target_parent_id)
+                if parsed_parent_id is not None:
+                    folder_ids.add(parsed_parent_id)
+    # Resolve the collected ids to display names; ids missing from the maps stay unnamed.
+    file_name_map = await _safe_fetch_file_names(db, user_id=user_id, file_ids=file_ids)
+    folder_name_map = await _safe_fetch_folder_names(db, user_id=user_id, folder_ids=folder_ids)
+
+    moved_file_names: list[str] = []
+    destination_folder_names: list[str] = []
+    for action in move_file_actions:
+        file_id = _coerce_positive_int(action.input.get("fileId"))
+        if file_id is not None:
+            file_name = file_name_map.get(file_id)
+            if file_name:
+                moved_file_names.append(file_name)
+        destination = _resolve_destination_folder_name(
+            action.input.get("targetFolderId"),
+            created_folder_by_step=created_folder_by_step,
+            folder_name_map=folder_name_map,
+        )
+        if destination:
+            destination_folder_names.append(destination)
+
+    moved_folder_count = len(move_folder_actions)
+    moved_file_count = len(move_file_actions)
+    clauses: list[str] = []
+    # Each clause is a Chinese phrase; the clauses are joined with "，并" at the end.
+    if created_folder_names:
+        unique_created = _unique_preserve_order(created_folder_names)
+        if len(unique_created) == 1:
+            clauses.append(f"创建“{unique_created[0]}”文件夹")
+        else:
+            clauses.append(f"创建 {len(unique_created)} 个文件夹")
+
+    if moved_file_count > 0:
+        clauses.append(
+            f"将{_format_moved_file_subject(moved_file_names, moved_file_count)}移动到"
+            f"{_format_destination_folder(destination_folder_names)}"
+        )
+
+    if moved_folder_count > 0:
+        clauses.append(f"移动 {moved_folder_count} 个文件夹")
+    # Nothing describable was found: keep the caller-supplied summary.
+    if not clauses:
+        return fallback_summary
+    return "，并".join(clauses) + "。"
+
+
+async def _safe_fetch_file_names(
+    db: AsyncSession,
+    *,
+    user_id: int,
+    file_ids: set[int],
+) -> dict[int, str]:
+    """Best-effort id -> name lookup for the user's active, latest-version files.
+
+    Any failure while querying yields an empty mapping instead of raising.
+    """
+    if not file_ids:
+        return {}
+    try:
+        # The filter is built inside the try so the whole lookup stays best-effort.
+        criteria = and_(
+            File.owner_id == user_id,
+            File.file_id.in_(sorted(file_ids)),
+            File.status == FileStatus.ACTIVE,
+            File.is_latest.is_(True),
+        )
+        result = await db.execute(select(File.file_id, File.file_name).where(criteria))
+        rows = result.all() if hasattr(result, "all") else []
+        # all() may hand back an awaitable (presumably for async doubles) - resolve it.
+        if inspect.isawaitable(rows):
+            rows = await rows
+    except Exception:
+        return {}
+    names: dict[int, str] = {}
+    # Rows that cannot be indexed, or that carry an unusable id or name, are skipped.
+    for row in rows if isinstance(rows, list) else []:
+        try:
+            raw_id, raw_name = row[0], row[1]
+        except Exception:
+            continue
+        file_id = _coerce_positive_int(raw_id)
+        label = str(raw_name or "").strip()
+        if file_id is not None and label:
+            names[file_id] = label
+    return names
+
+
+async def _safe_fetch_folder_names(
+    db: AsyncSession,
+    *,
+    user_id: int,
+    folder_ids: set[int],
+) -> dict[int, str]:
+    """Best-effort id -> name lookup for the user's active folders.
+
+    Any failure while querying yields an empty mapping instead of raising.
+    """
+    if not folder_ids:
+        return {}
+    try:
+        # The filter is built inside the try so the whole lookup stays best-effort.
+        criteria = and_(
+            Folder.owner_id == user_id,
+            Folder.folder_id.in_(sorted(folder_ids)),
+            Folder.status == FolderStatus.ACTIVE,
+        )
+        result = await db.execute(select(Folder.folder_id, Folder.folder_name).where(criteria))
+        rows = result.all() if hasattr(result, "all") else []
+        # all() may hand back an awaitable (presumably for async doubles) - resolve it.
+        if inspect.isawaitable(rows):
+            rows = await rows
+    except Exception:
+        return {}
+    names: dict[int, str] = {}
+    # Rows that cannot be indexed, or that carry an unusable id or name, are skipped.
+    for row in rows if isinstance(rows, list) else []:
+        try:
+            raw_id, raw_name = row[0], row[1]
+        except Exception:
+            continue
+        folder_id = _coerce_positive_int(raw_id)
+        label = str(raw_name or "").strip()
+        if folder_id is not None and label:
+            names[folder_id] = label
+    return names
+
+
+def _resolve_destination_folder_name(
+    raw_value: Any,
+    *,
+    created_folder_by_step: dict[int, str],
+    folder_name_map: dict[int, str],
+) -> str | None:
+    """Resolve a move target to a folder name, or ``None`` if it cannot be named.
+
+    Step references whose first path segment is ``folderId``/``id`` map to the
+    folder created in that step; positive ids are looked up in ``folder_name_map``.
+    """
+    target = raw_value.strip() if isinstance(raw_value, str) else ""
+    if not target:
+        return None
+    reference = parse_step_reference(target)
+    if reference is None:
+        folder_id = _coerce_positive_int(target)
+        return None if folder_id is None else folder_name_map.get(folder_id)
+    step, path = reference
+    names_folder = bool(path) and path[0].lower() in {"folderid", "id"}
+    return created_folder_by_step.get(step) if names_folder else None
+
+
+def _format_moved_file_subject(file_names: list[str], total_count: int) -> str:
+    """Describe the moved files for the summary sentence.
+
+    Yields a bare count when no names are known, a single quoted name for a
+    one-file move, and otherwise up to three quoted names followed by the count.
+    """
+    cleaned = [name.strip() for name in file_names if isinstance(name, str) and name.strip()]
+    distinct = _unique_preserve_order(cleaned)
+    if not distinct:
+        return f"{total_count} 个文件"
+    if total_count == 1 and len(distinct) == 1:
+        return f"“{distinct[0]}”"
+    shown = distinct[:3]
+    listing = "、".join(f"“{name}”" for name in shown)
+    return f"{listing}{'等' if total_count > len(shown) else '共'} {total_count} 个文件"
+
+
+def _format_destination_folder(folder_names: list[str]) -> str:
+    """Name the move destination for the summary sentence."""
+    cleaned = [name.strip() for name in folder_names if isinstance(name, str) and name.strip()]
+    distinct = _unique_preserve_order(cleaned)
+    # Exactly one distinct name is quoted; no names or several different ones
+    # fall back to a generic phrase.
+    if len(distinct) == 1:
+        return f"“{distinct[0]}”文件夹"
+    return "多个目标文件夹" if distinct else "目标文件夹"
+
+
+def _unique_preserve_order(items: list[str]) -> list[str]:
+    """Return ``items`` without duplicates, keeping first occurrences in order.
+
+    >>> _unique_preserve_order(["b", "a", "b"])
+    ['b', 'a']
+    """
+    # dict keys are unique and keep insertion order, so they serve as an
+    # ordered set here.
+    return list(dict.fromkeys(items))
+
+
+def _coerce_positive_int(value: Any) -> int | None:
+    """Return ``value`` as a positive int, or ``None`` when it is not one.
+
+    ``isdecimal()`` is used because ``isdigit()`` also admits "²", which ``int()`` rejects.
+    """
+    text = str(value or "").strip()
+    parsed = int(text) if text.isdecimal() else 0
+    return parsed if parsed > 0 else None
+
+
+def _evidence_mapping(value: Any) -> dict[str, Any]:
+    """Return the bounded preview of a dict ``value``; anything else becomes ``{}``."""
+    if not isinstance(value, dict):
+        return {}
+    preview = _evidence_value_preview(value, depth=0)
+    return preview if isinstance(preview, dict) else {}
+
+
+def _evidence_preview(value: Any) -> dict[str, Any]:
+    """Return the bounded preview of ``value``, wrapping non-dict previews under ``value``."""
+    preview = _evidence_value_preview(value, depth=0)
+    wrapped = preview if isinstance(preview, dict) else {"value": preview}
+    return wrapped
+
+
+def _evidence_value_preview(value: Any, *, depth: int) -> Any:
+    """Return a size-bounded, nesting-limited copy of ``value`` for evidence records.
+
+    Dicts keep their first 12 keys and lists their first 6 items; strings are
+    cut at 200 characters (120 once ``depth`` reaches 3, where containers are
+    stringified instead of being descended into).
+    """
+    at_floor = depth >= 3
+    text_cap = 120 if at_floor else 200
+    if isinstance(value, dict) and not at_floor:
+        pairs = list(value.items())
+        trimmed = {
+            str(key): _evidence_value_preview(item, depth=depth + 1)
+            for key, item in pairs[:12]
+        }
+        if len(pairs) > 12:
+            trimmed["_truncatedKeys"] = len(pairs) - 12
+        return trimmed
+    if isinstance(value, list) and not at_floor:
+        head = [_evidence_value_preview(item, depth=depth + 1) for item in value[:6]]
+        if len(value) > 6:
+            head.append(f"...({len(value) - 6} more)")
+        return head
+    # Scalars, and any container met at the depth floor, are handled below.
+    if isinstance(value, str):
+        return value[:text_cap] + ("…" if len(value) > text_cap else "")
+    if isinstance(value, (int, float, bool)) or value is None:
+        return value
+    return str(value)[:text_cap]
+
+
 def _cost_estimate(
     *,
     llm_payload: dict[str, Any],
diff --git a/app/src/fileflash/agents/tools/__init__.py b/app/src/fileflash/agents/tools/__init__.py
new file mode 100644
index 0000000..7ea9a9d
--- /dev/null
+++ b/app/src/fileflash/agents/tools/__init__.py
@@ -0,0 +1,5 @@
+from __future__ import annotations
+
+from . import drive as drive
+
+__all__ = ["drive"]
diff --git a/app/src/fileflash/agents/tools/drive.py b/app/src/fileflash/agents/tools/drive.py
new file mode 100644
index 0000000..f74d369
--- /dev/null
+++ b/app/src/fileflash/agents/tools/drive.py
@@ -0,0 +1,878 @@
+from __future__ import annotations
+
+from datetime import UTC, datetime
+from typing import Any
+
+from sqlalchemy import and_, select
+
+from ...core.errors import ApiError
+from ...core.mime import resolve_file_mime_type
+from ...models import File, Folder
+from ...models.enums import FileStatus, FolderStatus, FolderType
+from ...models.tables_storage import StorageObject
+from ...schemas.file import (
+    CreateFolderRequest,
+    GetFolderContentsQuery,
+    MoveFileRequest,
+    MoveFolderRequest,
+    RenameFileRequest,
+    RenameFolderRequest,
+)
+from ..harness.tool_registry import REGISTRY, ToolContext, ToolSpec
+
+_CATEGORIES = ("video", "audio", "image", "document", "archive", "other")  # canonical buckets
+_COUNT_FILE_NAME_LIMIT = 12  # cap on file names echoed in a drive.countFiles result
+
+
+async def _list_folder(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """List one page of a folder's contents, defaulting to the root folder."""
+    target = str(_first_value(args, "folderId", "parentFolderId") or "root")
+    listing_query = GetFolderContentsQuery(
+        folder_id=target,
+        page=_int_arg(args.get("page"), default=1, minimum=1),
+        per_page=_int_arg(args.get("perPage"), default=200, minimum=1, maximum=200),
+        search=_optional_text(args.get("search")),
+    )
+    service = ctx.folder_service
+    fetch = service.get_root_contents if target == "root" else service.get_folder_contents
+    listing = await fetch(user_id=ctx.user_id, query=listing_query)
+    return listing.model_dump(by_alias=True, mode="json")
+
+
+async def _count_files(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Count the user's active files in a folder scope, with optional name/category filters."""
+    folder_id = str(_first_value(args, "folderId", "parentFolderId") or "root")
+    recursive = _bool_arg(args.get("recursive"), default=True)
+    category = _normalize_category(args.get("category"))
+    search = str(args.get("search") or "").strip()
+    root_folder_id = await _resolve_folder_id(ctx, folder_id=folder_id)
+    folder_ids = await _folder_scope_ids(ctx, root_folder_id=root_folder_id, recursive=recursive)
+
+    statement = _active_files_query(ctx, folder_ids=folder_ids)
+    if search:
+        # Escape LIKE wildcards so "%" and "_" in the search text match literally.
+        escaped = search.replace("/", "//").replace("%", "/%").replace("_", "/_")
+        statement = statement.where(File.file_name.ilike(f"%{escaped}%", escape="/"))
+    statement = statement.order_by(File.file_name.asc())
+    rows = list(await ctx.db.scalars(statement))
+    by_mime_type: dict[str, int] = {}
+    sample_items: list[dict[str, Any]] = []
+    item_names: list[str] = []
+    names_truncated = False
+    total_items = 0
+    for row in rows:
+        if category is not None and _category_for_file(row) != category:
+            continue
+        total_items += 1
+        resolved_mime = _resolved_mime(row)
+        by_mime_type[resolved_mime] = by_mime_type.get(resolved_mime, 0) + 1
+        file_name = str(row.file_name or "").strip()
+        if file_name and len(item_names) < _COUNT_FILE_NAME_LIMIT:
+            item_names.append(file_name)
+        elif file_name:
+            names_truncated = True
+        if len(sample_items) < 5:
+            sample_items.append(await _file_payload(ctx, row, include_path=False))
+
+    return {
+        "totalItems": total_items,
+        "category": category,
+        "recursive": recursive,
+        "folderId": str(root_folder_id),
+        "search": search or None,
+        "byMimeType": dict(sorted(by_mime_type.items())),
+        "itemNames": item_names,
+        "itemNamesTruncated": names_truncated,
+        "sampleItems": sample_items,
+    }
+
+
+async def _create_folder(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Create a folder (under root unless a parent is given) and return its dump."""
+    folder_name = _required_text(args, "name", "folderName")
+    parent = _first_value(args, "parentFolderId", "targetParentId", "folderId") or "root"
+    request = CreateFolderRequest(folder_name=folder_name, parent_folder_id=str(parent))
+    created = await ctx.folder_service.create_folder(user_id=ctx.user_id, payload=request)
+    dumped = created.model_dump(by_alias=True, mode="json")
+    if "folderId" not in dumped:
+        dumped["folderId"] = dumped.get("id")
+    return dumped
+
+
+async def _move_file(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Move a file into the requested target folder via the file service."""
+    source_id = _required_text(args, "fileId", "id")
+    destination = _required_text(args, "targetFolderId", "targetParentId")
+    # A missing or empty shareHandling falls back to "keep".
+    request = MoveFileRequest(
+        target_folder_id=destination,
+        share_handling=str(args.get("shareHandling") or "keep"),
+    )
+    service = ctx.file_service
+    moved = await service.move_file(user_id=ctx.user_id, file_id=source_id, payload=request)
+    return moved.model_dump(by_alias=True, mode="json")
+
+
+async def _move_folder(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Move a folder under the requested parent folder via the folder service."""
+    source_id = _required_text(args, "folderId", "id")
+    new_parent = _required_text(args, "targetParentId", "targetFolderId")
+    # A missing or empty shareHandling falls back to "keep".
+    request = MoveFolderRequest(
+        target_parent_id=new_parent,
+        share_handling=str(args.get("shareHandling") or "keep"),
+    )
+    service = ctx.folder_service
+    moved = await service.move_folder(user_id=ctx.user_id, folder_id=source_id, payload=request)
+    return moved.model_dump(by_alias=True, mode="json")
+
+
+async def _rename_file(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Rename a file; ``fileId``/``fileName`` may also be passed as ``id``/``name``."""
+    target_id = _required_text(args, "fileId", "id")
+    request = RenameFileRequest(file_name=_required_text(args, "fileName", "name"))
+    renamed = await ctx.file_service.rename_file(
+        user_id=ctx.user_id, file_id=target_id, payload=request
+    )
+    # Dump with API aliases in JSON-compatible form.
+    return renamed.model_dump(by_alias=True, mode="json")
+
+
+async def _rename_folder(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Rename a folder; ``folderId``/``folderName`` may also be passed as ``id``/``name``."""
+    target_id = _required_text(args, "folderId", "id")
+    request = RenameFolderRequest(folder_name=_required_text(args, "folderName", "name"))
+    renamed = await ctx.folder_service.rename_folder(
+        user_id=ctx.user_id, folder_id=target_id, payload=request
+    )
+    # Dump with API aliases in JSON-compatible form.
+    return renamed.model_dump(by_alias=True, mode="json")
+
+
+async def _delete_file(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    target_id = _required_text(args, "fileId", "id")  # "id" is accepted as an alias
+    outcome = await ctx.file_service.delete_file(user_id=ctx.user_id, file_id=target_id)
+    return outcome.model_dump(by_alias=True, mode="json")
+
+
+async def _delete_folder(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    target_id = _required_text(args, "folderId", "id")  # "id" is accepted as an alias
+    outcome = await ctx.folder_service.delete_folder(user_id=ctx.user_id, folder_id=target_id)
+    return outcome.model_dump(by_alias=True, mode="json")
+
+
+async def _search_files(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Search active files; the name query matches literally (LIKE wildcards are escaped)."""
+    query = _optional_text(args.get("query")) or _optional_text(args.get("search")) or ""
+    folder_id = str(args.get("folderId") or "root")
+    recursive = _bool_arg(args.get("recursive"), default=True)
+    category = _normalize_category(args.get("category"))
+    mime_prefix = _optional_text(args.get("mimePrefix"))
+    modified_after = _parse_datetime_arg(args.get("modifiedAfter"))
+    limit = _int_arg(args.get("limit"), default=50, minimum=1, maximum=200)
+    root_folder_id = await _resolve_folder_id(ctx, folder_id=folder_id)
+    folder_ids = await _folder_scope_ids(ctx, root_folder_id=root_folder_id, recursive=recursive)
+    statement = _active_files_query(ctx, folder_ids=folder_ids)
+    if query:
+        escaped = query.replace("/", "//").replace("%", "/%").replace("_", "/_")
+        statement = statement.where(File.file_name.ilike(f"%{escaped}%", escape="/"))
+    if modified_after is not None:
+        statement = statement.where(File.updated_at >= modified_after)
+    statement = statement.order_by(File.file_name.asc())
+
+    items: list[dict[str, Any]] = []
+    for row in list(await ctx.db.scalars(statement)):
+        if mime_prefix and not _resolved_mime(row).lower().startswith(mime_prefix.lower()):
+            continue
+        if category is not None and _category_for_file(row) != category:
+            continue
+        items.append(await _file_payload(ctx, row, include_path=True))
+        if len(items) >= limit:
+            break
+
+    return {
+        "items": items,
+        "totalItems": len(items),
+        "query": query or None,
+        "folderId": str(root_folder_id),
+        "recursive": recursive,
+        "category": category,
+        "mimePrefix": mime_prefix,
+        "modifiedAfter": modified_after.isoformat() if modified_after else None,
+    }
+
+
+async def _get_file_info(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Return detailed metadata for one active, latest-version file of the user.
+
+    Missing hash fields are reported as ``None``; a bad or unknown id raises ``ApiError``.
+    """
+    file_id = _parse_positive_int(_required_text(args, "fileId", "id"), "fileId")
+    row = await ctx.db.scalar(
+        select(File).where(
+            File.file_id == file_id,
+            File.owner_id == ctx.user_id,
+            File.status == FileStatus.ACTIVE,
+            File.is_latest.is_(True),
+        )
+    )
+    if row is None:
+        raise ApiError(status_code=404, code=404, message="File not found")
+    storage = await ctx.db.get(StorageObject, int(row.storage_object_id))
+    object_hash = storage.object_hash if storage else None
+    hash_algorithm = storage.hash_algorithm if storage else None
+    payload = await _file_payload(ctx, row, include_path=True)
+    payload["objectHash"] = str(object_hash) if object_hash else None
+    payload["hashAlgorithm"] = str(hash_algorithm) if hash_algorithm else None
+    payload["storageObjectId"] = str(row.storage_object_id)
+    payload["category"] = _category_for_file(row)
+    return payload
+
+
+async def _list_recent(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """List the user's most recently updated active files, newest first."""
+    max_items = _int_arg(args.get("limit"), default=20, minimum=1, maximum=50)
+    cutoff = _parse_datetime_arg(args.get("since"))
+    recent_query = _active_files_query(ctx, folder_ids=None)
+    if cutoff is not None:
+        recent_query = recent_query.where(File.updated_at >= cutoff)
+    # file_id breaks ties so rows with equal timestamps keep a deterministic order.
+    recent_query = recent_query.order_by(File.updated_at.desc(), File.file_id.desc())
+    files = list(await ctx.db.scalars(recent_query.limit(max_items)))
+    payloads = [await _file_payload(ctx, item, include_path=True) for item in files]
+    cutoff_text = cutoff.isoformat() if cutoff else None
+    # totalItems is the size of this page, not a count of all matching files.
+    return {"items": payloads, "totalItems": len(files), "limit": max_items, "since": cutoff_text}
+
+
+async def _stats_by_category(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Aggregate file counts and byte totals per broad category under a folder.
+
+    The result holds the nested ``categories`` map plus each category's count
+    repeated as a top-level key.
+    """
+    requested = str(args.get("folderId") or "root")
+    recursive = _bool_arg(args.get("recursive"), default=True)
+    root_folder_id = await _resolve_folder_id(ctx, folder_id=requested)
+    scope = await _folder_scope_ids(ctx, root_folder_id=root_folder_id, recursive=recursive)
+    files = list(await ctx.db.scalars(_active_files_query(ctx, folder_ids=scope)))
+
+    buckets = {name: {"count": 0, "totalSize": 0} for name in _CATEGORIES}
+    total_size = 0
+    for item in files:
+        bucket = buckets[_category_for_file(item)]
+        size = int(item.file_size or 0)
+        bucket["count"] += 1
+        bucket["totalSize"] += size
+        total_size += size
+
+    summary: dict[str, Any] = {
+        "folderId": str(root_folder_id),
+        "recursive": recursive,
+        "totalItems": len(files),
+        "totalSize": total_size,
+        "categories": buckets,
+    }
+
+    # Flattened per-category counts, added in the fixed _CATEGORIES order.
+    summary.update({name: buckets[name]["count"] for name in _CATEGORIES})
+    return summary
+
+
+async def _find_duplicates(ctx: ToolContext, args: dict[str, Any]) -> dict[str, Any]:
+    """Group the user's active files that share a content hash or a name+size pair."""
+    folder_id = str(args.get("folderId") or "root")
+    recursive = _bool_arg(args.get("recursive"), default=True)
+    by = str(args.get("by") or "hash").strip() or "hash"
+    if by not in {"hash", "nameSize"}:
+        raise ApiError(status_code=400, code=400, message="Invalid duplicate mode")
+
+    root_folder_id = await _resolve_folder_id(ctx, folder_id=folder_id)
+    folder_ids = await _folder_scope_ids(ctx, root_folder_id=root_folder_id, recursive=recursive)
+    rows = (
+        await ctx.db.execute(
+            _active_files_query(ctx, folder_ids=folder_ids)
+            .join(StorageObject, StorageObject.object_id == File.storage_object_id)
+            .add_columns(StorageObject.object_hash, StorageObject.hash_algorithm)
+            .order_by(File.file_name.asc())
+        )
+    ).all()
+
+    groups: dict[str, dict[str, Any]] = {}
+    for file_row, object_hash, hash_algorithm in rows:
+        if by == "hash":
+            if not object_hash:
+                continue
+            key = f"{hash_algorithm}:{object_hash}:{int(file_row.file_size or 0)}"
+        else:
+            key = f"{file_row.file_name.lower()}:{int(file_row.file_size or 0)}"
+        group = groups.setdefault(
+            key,
+            {
+                "key": key,
+                "by": by,
+                "hash": str(object_hash) if object_hash else None,
+                "hashAlgorithm": str(hash_algorithm) if hash_algorithm else None,
+                "size": int(file_row.file_size or 0),
+                "files": [],
+            },
+        )
+        group["files"].append(file_row)
+    # Payloads walk the folder chain (extra queries), so build them for duplicates only.
+    duplicate_groups = [group for group in groups.values() if len(group["files"]) > 1]
+    for group in duplicate_groups:
+        group["files"] = [await _file_payload(ctx, item, include_path=True) for item in group["files"]]
+    return {
+        "folderId": str(root_folder_id),
+        "recursive": recursive,
+        "by": by,
+        "groups": duplicate_groups,
+        "totalGroups": len(duplicate_groups),
+        "totalFiles": sum(len(group["files"]) for group in duplicate_groups),
+    }
+
+
+def _active_files_query(ctx: ToolContext, *, folder_ids: list[int] | None):
+    """Select the user's active, latest-version files; ``None`` means any folder."""
+    owned_active = and_(
+        File.owner_id == ctx.user_id,
+        File.status == FileStatus.ACTIVE,
+        File.is_latest.is_(True),
+    )
+    query = select(File).where(owned_active)
+    if folder_ids is None:
+        return query
+    return query.where(File.folder_id.in_(folder_ids))
+
+
+async def _file_payload(ctx: ToolContext, row: File, *, include_path: bool) -> dict[str, Any]:
+    """Serialise a file row for tool output, optionally adding its folder path."""
+    file_id = str(row.file_id)
+    created, updated = row.created_at, row.updated_at
+    payload = {
+        "id": file_id,
+        "fileId": file_id,
+        "name": str(row.file_name),
+        "size": int(row.file_size or 0),
+        "mimeType": _resolved_mime(row),
+        "folderId": str(row.folder_id),
+        "createdAt": created.isoformat() if created else None,
+        "updatedAt": updated.isoformat() if updated else None,
+    }
+    if not include_path:
+        return payload
+    # An unresolvable folder chain yields "" and the path is then the bare file name.
+    folder_path = await _folder_path(ctx, folder_id=int(row.folder_id))
+    payload["path"] = f"{folder_path}/{row.file_name}" if folder_path else str(row.file_name)
+    return payload
+
+
+async def _resolve_folder_id(ctx: ToolContext, *, folder_id: str) -> int:
+    """Translate a tool-supplied folder id into a verified numeric folder id.
+
+    An empty id or ``"root"`` resolves to the user's active root folder; any other
+    value must parse as a positive integer naming an active folder of the user.
+    Raises ``ApiError`` (400 for a malformed id, 404 when nothing matches).
+    """
+    wants_root = not folder_id or folder_id == "root"
+    if wants_root:
+        criteria = and_(
+            Folder.owner_id == ctx.user_id,
+            Folder.parent_folder_id.is_(None),
+            Folder.folder_type == FolderType.ROOT,
+            Folder.status == FolderStatus.ACTIVE,
+        )
+        missing_message = "Root folder not found"
+    else:
+        numeric_id = _parse_positive_int(folder_id, "folderId")
+        criteria = and_(
+            Folder.folder_id == numeric_id,
+            Folder.owner_id == ctx.user_id,
+            Folder.status == FolderStatus.ACTIVE,
+        )
+        missing_message = "Folder not found"
+    found = await ctx.db.scalar(select(Folder.folder_id).where(criteria))
+    if found is None:
+        raise ApiError(status_code=404, code=404, message=missing_message)
+    return int(found)
+
+
+async def _folder_scope_ids(ctx: ToolContext, *, root_folder_id: int, recursive: bool) -> list[int]:
+    """Pick the folder ids a file query should cover.
+
+    Non-recursive scopes hold only ``root_folder_id``; recursive scopes are
+    delegated to ``_active_descendant_folder_ids``.
+    """
+    if recursive:
+        return await _active_descendant_folder_ids(ctx, root_folder_id=root_folder_id)
+    return [root_folder_id]
+
+
+async def _active_descendant_folder_ids(ctx: ToolContext, *, root_folder_id: int) -> list[int]:
+    """Collect ``root_folder_id`` and every active descendant via a recursive CTE.
+
+    Only folders owned by the current user and in ``ACTIVE`` status are followed.
+    """
+    anchor = (
+        select(Folder.folder_id)
+        .where(
+            Folder.folder_id == root_folder_id,
+            Folder.owner_id == ctx.user_id,
+            Folder.status == FolderStatus.ACTIVE,
+        )
+    )
+    tree = anchor.cte(name="agent_tool_descendants", recursive=True)
+    children = select(Folder.folder_id).where(
+        Folder.parent_folder_id == tree.c.folder_id,
+        Folder.owner_id == ctx.user_id,
+        Folder.status == FolderStatus.ACTIVE,
+    )
+    tree = tree.union_all(children)
+    # The anchor row is part of the CTE, so the root id itself is in the result.
+    result = await ctx.db.scalars(select(tree.c.folder_id))
+    return [int(folder_id) for folder_id in result]
+
+
+async def _folder_path(ctx: ToolContext, *, folder_id: int) -> str:
+    """Build the ``/``-joined folder path from the topmost reachable ancestor down."""
+    parts: list[str] = []
+    visited: set[int] = set()
+    current_id: int | None = folder_id
+    # Stop on a repeated id so a corrupted (cyclic) parent chain cannot loop forever.
+    while current_id is not None and current_id not in visited:
+        visited.add(current_id)
+        lookup = select(Folder).where(
+            Folder.folder_id == current_id,
+            Folder.owner_id == ctx.user_id,
+            Folder.status == FolderStatus.ACTIVE,
+        )
+        folder = await ctx.db.scalar(lookup)
+        if folder is None:
+            break
+        parts.append(str(folder.folder_name))
+        current_id = int(folder.parent_folder_id) if folder.parent_folder_id is not None else None
+    return "/" + "/".join(reversed(parts)) if parts else ""
+
+
+def _first_value(args: dict[str, Any], *keys: str) -> Any:
+    """Return the first value among ``keys`` that is neither ``None`` nor ``""``."""
+    candidates = (args.get(name) for name in keys)
+    present = (item for item in candidates if item not in (None, ""))
+    # Falsy-but-meaningful values such as 0 or False are kept.
+    return next(present, None)
+
+
+def _required_text(args: dict[str, Any], *keys: str) -> str:
+    """Return the first usable value among ``keys`` as stripped text, else raise ``ApiError``."""
+    found = _first_value(args, *keys)
+    # Whitespace-only values are treated the same as a missing key.
+    cleaned = "" if found is None else str(found).strip()
+    if not cleaned:
+        raise ApiError(status_code=400, code=400, message=f"Missing required tool input: {keys[0]}")
+    return cleaned
+
+
+def _optional_text(value: Any) -> str | None:
+    cleaned = str(value or "").strip()  # falsy inputs (None, "", 0) collapse to ""
+    return cleaned if cleaned else None
+
+
+def _bool_arg(value: Any, *, default: bool) -> bool:
+    """Coerce a loosely typed flag to ``bool``, using ``default`` when unclear."""
+    if isinstance(value, bool):
+        return value
+    if value is None:
+        return default
+    token = str(value).strip().lower()
+    is_true = token in {"1", "true", "yes", "y"}
+    is_false = token in {"0", "false", "no", "n"}
+    # Unrecognised spellings fall through to the default rather than raising.
+    return is_true if (is_true or is_false) else default
+
+
+def _int_arg(value: Any, *, default: int, minimum: int, maximum: int | None = None) -> int:
+    """Parse an integer tool argument and clamp it to ``[minimum, maximum]``.
+
+    ``None`` and values ``int()`` cannot convert fall back to ``default`` before
+    the clamp is applied; ``maximum=None`` leaves the upper end open.
+    """
+    try:
+        parsed = int(value if value is not None else default)
+    except (TypeError, ValueError, OverflowError):
+        # OverflowError covers int(float("inf")), e.g. a JSON number such as 1e999.
+        parsed = default
+    parsed = max(minimum, parsed)
+    if maximum is not None:
+        parsed = min(maximum, parsed)
+    return parsed
+
+
+def _parse_positive_int(value: str, field_name: str) -> int:  # ApiError(400) unless value > 0
+    try:
+        number = int(value)
+    except ValueError as exc:
+        raise ApiError(status_code=400, code=400, message=f"Invalid {field_name}") from exc
+    if number > 0:
+        return number
+    raise ApiError(status_code=400, code=400, message=f"Invalid {field_name}")
+
+
+def _parse_datetime_arg(value: Any) -> datetime | None:
+    """Parse an ISO-8601 timestamp; blank input gives ``None``, naive values become UTC."""
+    raw = str(value or "").strip()
+    if not raw:
+        return None
+    try:
+        # "Z" is rewritten to an explicit +00:00 offset before parsing.
+        moment = datetime.fromisoformat(raw.replace("Z", "+00:00"))
+    except ValueError as exc:
+        raise ApiError(status_code=400, code=400, message="Invalid datetime") from exc
+    return moment if moment.tzinfo is not None else moment.replace(tzinfo=UTC)
+
+
+def _normalize_category(value: Any) -> str | None:
+    """Map a category label or a known alias onto a canonical category.
+
+    Matching ignores case and surrounding whitespace; anything that is neither an
+    alias nor a member of ``_CATEGORIES`` yields ``None``.
+    """
+    label = str(value or "").strip().lower()
+
+    alias_groups = {
+        "video": (
+            # English spellings
+            "movies", "movie", "film", "films", "videos", "anime", "animation",
+            # Chinese spellings
+            "视频", "影片", "电影", "动漫", "番剧",
+        ),
+        "document": ("documents", "docs"),
+        "image": ("images", "pictures"),
+        "archive": ("archives", "compressed"),
+    }
+    # Aliases are unique across groups, so the first matching group is the only one.
+    for canonical, spellings in alias_groups.items():
+        if label in spellings:
+            label = canonical
+            break
+
+    return label if label in _CATEGORIES else None
+
+
+def _resolved_mime(row: File) -> str:
+    """Delegate MIME resolution to ``resolve_file_mime_type``, passing the row's
+    stored MIME type, extension and file name through unchanged.
+    """
+    stored_type, extension, name = row.mime_type, row.file_ext, row.file_name
+    return resolve_file_mime_type(mime_type=stored_type, file_ext=extension, file_name=name)
+
+
+def _category_for_file(row: File) -> str:
+    """Classify a file by MIME type or extension; rules run in order, first hit wins."""
+    mime = _resolved_mime(row).lower()
+    ext = _normalized_extension(row.file_ext) or _filename_extension(row.file_name)
+    document_exts = {"pdf", "doc", "docx", "xls", "xlsx", "ppt", "pptx", "txt", "md"}
+    rules = (
+        ("video", mime.startswith("video/"), {"mp4", "mov", "avi", "mkv", "webm", "m4v"}),
+        ("audio", mime.startswith("audio/"), {"mp3", "wav", "flac", "m4a", "aac", "ogg"}),
+        ("image", mime.startswith("image/"), {"jpg", "jpeg", "png", "gif", "webp", "svg", "bmp"}),
+        ("document", mime == "application/pdf", document_exts),
+        ("archive", False, {"zip", "rar", "7z", "tar", "gz", "bz2", "xz"}),
+    )
+    matches = (name for name, mime_hit, extensions in rules if mime_hit or ext in extensions)
+    return next(matches, "other")
+
+
+def _count_files_answer(output: dict[str, Any]) -> str:
+    """Render a ``drive.countFiles`` result as a one-sentence Chinese answer."""
+    total_items = int(output.get("totalItems") or 0)
+    qualifier = _search_qualifier(output)
+    category = str(output.get("category") or "").strip().lower()
+
+    # One sentence per known category; anything else uses the generic wording.
+    sentences = {
+        "video": f"你上传了 {total_items} 部{qualifier}电影（按视频文件统计）。",
+        "audio": f"你上传了 {total_items} 个{qualifier}音频文件。",
+        "image": f"你上传了 {total_items} 张{qualifier}图片。",
+        "document": f"你上传了 {total_items} 个{qualifier}文档。",
+        "archive": f"你上传了 {total_items} 个{qualifier}压缩包。",
+    }
+    return sentences.get(category, f"你上传了 {total_items} 个{qualifier}文件。")
+
+
+def _search_qualifier(output: dict[str, Any]) -> str:
+    """Return the Chinese "name contains …" qualifier, or ``""`` without a search."""
+    search = str(output.get("search") or "").strip()
+    # Whitespace-only search terms count as "no search".
+    return f"名称包含“{search}”的" if search else ""
+
+
+def _normalized_extension(value: str | None) -> str:
+    return (str(value) if value else "").strip().lower().lstrip(".")  # "" for None/empty
+
+
+def _filename_extension(value: str | None) -> str:
+    """Return the lower-cased text after the last dot, or ``""`` if there is no dot."""
+    lowered = str(value or "").strip().lower()
+    _stem, dot, extension = lowered.rpartition(".")
+    return extension if dot else ""
+
+
+def _schema(properties: dict[str, Any], required: list[str] | None = None) -> dict[str, Any]:
+    """Wrap ``properties`` in a JSON-schema ``object``; ``required`` defaults to ``[]``."""
+    schema: dict[str, Any] = {"type": "object"}
+    schema["properties"] = properties
+    schema["required"] = required if required else []
+    return schema
+
+
+_FOLDER_ID = {"type": "string", "description": "Folder id, or root for the user's root folder."}
+_FILE_ID = {"type": "string", "description": "File id owned by the current user."}
+_CATEGORY = {"type": "string", "enum": list(_CATEGORIES)}  # canonical names only, no aliases
+_SHARE_HANDLING = {"type": "string", "enum": ["keep", "revoke"], "default": "keep"}  # move tools
+
+
+REGISTRY.register(  # read-only listing; the handler caps perPage at 200
+    ToolSpec(
+        name="drive.listFolder",
+        description="List direct files and folders inside a folder.",
+        input_schema=_schema(
+            {
+                "folderId": _FOLDER_ID,
+                "page": {"type": "integer", "minimum": 1, "default": 1},
+                "perPage": {"type": "integer", "minimum": 1, "maximum": 200, "default": 200},
+                "search": {"type": "string"},
+            }
+        ),
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_list_folder,
+    )
+)
+
+REGISTRY.register(  # read-only count; the only tool here that sets an answer_formatter
+    ToolSpec(
+        name="drive.countFiles",
+        description=(
+            "Count files under a folder. Supports recursive counts, broad file categories, "
+            "and filename contains search."
+        ),
+        input_schema=_schema(
+            {
+                "folderId": _FOLDER_ID,
+                "recursive": {"type": "boolean", "default": True},
+                "category": _CATEGORY,
+                "search": {"type": "string"},
+            }
+        ),
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_count_files,
+        answer_formatter=_count_files_answer,
+    )
+)
+
+REGISTRY.register(  # write tool, medium risk, registered without a confirmation step
+    ToolSpec(
+        name="drive.createFolder",
+        description="Create a folder under parentFolderId with name.",
+        input_schema=_schema(
+            {
+                "parentFolderId": _FOLDER_ID,
+                "name": {"type": "string", "minLength": 1, "maxLength": 255},
+            },
+            required=["name"],
+        ),
+        side_effect="write",
+        risk_level="medium",
+        requires_confirmation=False,
+        handler=_create_folder,
+    )
+)
+
+REGISTRY.register(  # write tool, medium risk; shareHandling defaults to "keep"
+    ToolSpec(
+        name="drive.moveFile",
+        description="Move fileId into targetFolderId.",
+        input_schema=_schema(
+            {
+                "fileId": _FILE_ID,
+                "targetFolderId": _FOLDER_ID,
+                "shareHandling": _SHARE_HANDLING,
+            },
+            required=["fileId", "targetFolderId"],
+        ),
+        side_effect="write",
+        risk_level="medium",
+        requires_confirmation=False,
+        handler=_move_file,
+    )
+)
+
+REGISTRY.register(  # write tool, medium risk; shareHandling defaults to "keep"
+    ToolSpec(
+        name="drive.moveFolder",
+        description="Move folderId into targetParentId.",
+        input_schema=_schema(
+            {
+                "folderId": _FOLDER_ID,
+                "targetParentId": _FOLDER_ID,
+                "shareHandling": _SHARE_HANDLING,
+            },
+            required=["folderId", "targetParentId"],
+        ),
+        side_effect="write",
+        risk_level="medium",
+        requires_confirmation=False,
+        handler=_move_folder,
+    )
+)
+
+REGISTRY.register(  # write tool, medium risk; new name limited to 1-255 characters
+    ToolSpec(
+        name="drive.renameFile",
+        description="Rename fileId to fileName.",
+        input_schema=_schema(
+            {
+                "fileId": _FILE_ID,
+                "fileName": {"type": "string", "minLength": 1, "maxLength": 255},
+            },
+            required=["fileId", "fileName"],
+        ),
+        side_effect="write",
+        risk_level="medium",
+        requires_confirmation=False,
+        handler=_rename_file,
+    )
+)
+
+REGISTRY.register(  # write tool, medium risk; new name limited to 1-255 characters
+    ToolSpec(
+        name="drive.renameFolder",
+        description="Rename folderId to folderName.",
+        input_schema=_schema(
+            {
+                "folderId": _FOLDER_ID,
+                "folderName": {"type": "string", "minLength": 1, "maxLength": 255},
+            },
+            required=["folderId", "folderName"],
+        ),
+        side_effect="write",
+        risk_level="medium",
+        requires_confirmation=False,
+        handler=_rename_folder,
+    )
+)
+
+REGISTRY.register(  # high risk: registered with requires_confirmation=True
+    ToolSpec(
+        name="drive.deleteFile",
+        description="Soft-delete fileId into the recycle bin. This is high risk.",
+        input_schema=_schema({"fileId": _FILE_ID}, required=["fileId"]),
+        side_effect="write",
+        risk_level="high",
+        requires_confirmation=True,
+        handler=_delete_file,
+    )
+)
+
+REGISTRY.register(  # high risk: registered with requires_confirmation=True
+    ToolSpec(
+        name="drive.deleteFolder",
+        description="Soft-delete folderId into the recycle bin. This is high risk.",
+        input_schema=_schema({"folderId": _FOLDER_ID}, required=["folderId"]),
+        side_effect="write",
+        risk_level="high",
+        requires_confirmation=True,
+        handler=_delete_folder,
+    )
+)
+
+REGISTRY.register(  # read-only search; the handler clamps limit to 1-200
+    ToolSpec(
+        name="drive.searchFiles",
+        description="Search active files by filename, folder scope, category, MIME prefix, and update time.",
+        input_schema=_schema(
+            {
+                "query": {"type": "string"},
+                "folderId": _FOLDER_ID,
+                "recursive": {"type": "boolean", "default": True},
+                "category": _CATEGORY,
+                "mimePrefix": {"type": "string", "description": "MIME type prefix such as video/."},
+                "modifiedAfter": {"type": "string", "format": "date-time"},
+                "limit": {"type": "integer", "minimum": 1, "maximum": 200, "default": 50},
+            }
+        ),
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_search_files,
+    )
+)
+
+REGISTRY.register(  # read-only lookup of a single file by id
+    ToolSpec(
+        name="drive.getFileInfo",
+        description="Return detailed metadata for one active file.",
+        input_schema=_schema({"fileId": _FILE_ID}, required=["fileId"]),
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_get_file_info,
+    )
+)
+
+REGISTRY.register(  # read-only; the handler clamps limit to 1-50
+    ToolSpec(
+        name="drive.listRecent",
+        description="List recently updated active files.",
+        input_schema=_schema(
+            {
+                "limit": {"type": "integer", "minimum": 1, "maximum": 50, "default": 20},
+                "since": {"type": "string", "format": "date-time"},
+            }
+        ),
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_list_recent,
+    )
+)
+
+REGISTRY.register(  # read-only aggregation of counts and sizes per category
+    ToolSpec(
+        name="drive.statsByCategory",
+        description="Compute file counts and sizes by broad category under a folder.",
+        input_schema=_schema(
+            {
+                "folderId": _FOLDER_ID,
+                "recursive": {"type": "boolean", "default": True},
+            }
+        ),
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_stats_by_category,
+    )
+)
+
+REGISTRY.register(  # read-only; the handler rejects any "by" other than hash/nameSize
+    ToolSpec(
+        name="drive.findDuplicates",
+        description="Find duplicate active files by content hash or by name plus size.",
+        input_schema=_schema(
+            {
+                "folderId": _FOLDER_ID,
+                "recursive": {"type": "boolean", "default": True},
+                "by": {"type": "string", "enum": ["hash", "nameSize"], "default": "hash"},
+            }
+        ),
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_find_duplicates,
+    )
+)
+
+__all__ = []  # no public names; importing this module registers the drive tools
diff --git a/app/src/fileflash/agents/worker.py b/app/src/fileflash/agents/worker.py
index 6fd4e89..a122e31 100644
--- a/app/src/fileflash/agents/worker.py
+++ b/app/src/fileflash/agents/worker.py
@@ -17,6 +17,7 @@
 from ..models import BackgroundJob
 from ..services.job_queue import RedisStreamJobQueue
 from ..workers.contracts import WorkerJobMessage
+from .harness.event_bus import AgentEventBus, AgentEventEnvelope, build_agent_event_bus
 from .runtime import AgentJobCanceled, ExecuteRunner, PlanRunner
 
 logger = logging.getLogger(__name__)
@@ -28,10 +29,12 @@ def __init__(
         *,
         queue: RedisStreamJobQueue,
         session_factory: async_sessionmaker[AsyncSession] = SessionLocal,
+        event_bus: AgentEventBus | None = None,
     ) -> None:
         self._settings = get_settings()
         self._queue = queue
         self._session_factory = session_factory
+        self._event_bus = event_bus or build_agent_event_bus(settings=self._settings)
 
     async def run(self) -> None:
         logger.info(
@@ -103,12 +106,15 @@ async def _run_job(self, *, job: BackgroundJob) -> tuple[dict[str, Any], str]:
             if fresh_job is None:
                 raise ApiError(status_code=404, code=404, message="Job not found")
             if fresh_job.task_type == "agent.plan":
-                result = await PlanRunner(settings=self._settings).run(db=db, job=fresh_job)
+                result = await PlanRunner(
+                    settings=self._settings,
+                    event_bus=self._event_bus,
+                ).run(db=db, job=fresh_job)
                 phase = "awaiting_confirm" if result.requires_confirmation else "completed"
-                return result.model_dump(by_alias=True), phase
+                return result.model_dump(by_alias=True, mode="json"), phase
             if fresh_job.task_type == "agent.execute":
-                result = await ExecuteRunner().run(db=db, job=fresh_job)
-                return result.model_dump(by_alias=True), "completed"
+                result = await ExecuteRunner(event_bus=self._event_bus).run(db=db, job=fresh_job)
+                return result.model_dump(by_alias=True, mode="json"), "completed"
             raise ApiError(
                 status_code=400,
                 code=400,
@@ -135,6 +141,8 @@ async def _mark_running(self, message: WorkerJobMessage) -> BackgroundJob | None
                 return job
 
     async def _mark_succeeded(self, *, job_id: int, result: dict[str, Any], phase: str) -> None:
+        safe_result = jsonable_encoder(result)
+        should_publish = False
         async with self._session_factory() as db:
             async with db.begin():
                 await apply_local_lock_timeout(db)
@@ -147,14 +155,22 @@ async def _mark_succeeded(self, *, job_id: int, result: dict[str, Any], phase: s
                     return
                 now = datetime.now(UTC)
                 job.status = "succeeded"
-                job.result = jsonable_encoder(result)
+                job.result = safe_result
                 job.error_message = None
                 job.agent_phase = phase
                 job.finished_at = now
                 job.updated_at = now
+                should_publish = True
+        if should_publish:
+            await self._publish_terminal(
+                job_id=job_id,
+                event_type="job.succeeded",
+                payload={"status": "succeeded", "agentPhase": phase, "data": {"result": safe_result}},
+            )
 
     async def _mark_failed(self, *, job_id: int, error: Exception) -> None:
         message = _error_message(error)
+        should_publish = False
         async with self._session_factory() as db:
             async with db.begin():
                 await apply_local_lock_timeout(db)
@@ -171,8 +187,21 @@ async def _mark_failed(self, *, job_id: int, error: Exception) -> None:
                 job.error_message = message[:2000]
                 job.finished_at = now
                 job.updated_at = now
+                should_publish = True
+        if should_publish:
+            await self._publish_terminal(
+                job_id=job_id,
+                event_type="job.failed",
+                payload={
+                    "status": "failed",
+                    "agentPhase": "failed",
+                    "message": message[:2000],
+                    "data": {"errorMessage": message[:2000]},
+                },
+            )
 
     async def _mark_canceled(self, *, job_id: int) -> None:
+        should_publish = False
         async with self._session_factory() as db:
             async with db.begin():
                 await apply_local_lock_timeout(db)
@@ -187,6 +216,41 @@ async def _mark_canceled(self, *, job_id: int) -> None:
                 job.cancel_requested_at = job.cancel_requested_at or now
                 job.finished_at = now
                 job.updated_at = now
+                should_publish = True
+        if should_publish:
+            await self._publish_terminal(
+                job_id=job_id,
+                event_type="job.canceled",
+                payload={"status": "canceled", "agentPhase": "canceled"},
+            )
+
+    async def _publish_terminal(
+        self,
+        *,
+        job_id: int,
+        event_type: str,
+        payload: dict[str, Any] | None = None,
+    ) -> None:
+        """Publish a terminal job event on the event bus, best-effort.
+
+        A missing or empty ``payload`` is sent as ``{}``. Any exception raised
+        while building or publishing the envelope is logged and swallowed.
+        """
+        try:
+            envelope = AgentEventEnvelope(
+                job_id=job_id,
+                event_type=event_type,
+                payload=payload or {},
+                emitted_at=datetime.now(UTC),
+            )
+            await self._event_bus.publish(envelope)
+        except Exception:
+            # Deliberate catch-all: publishing must never fail the caller.
+            logger.exception(
+                "Failed to publish terminal event jobId=%s eventType=%s",
+                job_id,
+                event_type,
+            )
 
 
 def _error_message(error: Exception) -> str:
diff --git a/app/src/fileflash/core/deps.py b/app/src/fileflash/core/deps.py
index c4fd5be..5ac1f45 100644
--- a/app/src/fileflash/core/deps.py
+++ b/app/src/fileflash/core/deps.py
@@ -5,9 +5,10 @@
 from jwt import InvalidTokenError
 from sqlalchemy.ext.asyncio import AsyncSession
 
+from ..agents.harness.event_bus import AgentEventBus, build_agent_event_bus
 from ..db.deps import get_db
-from ..models.tables_identity import User
 from ..models.enums import UserRole
+from ..models.tables_identity import User
 from ..repositories import (
     AgentActionLogRepository,
     AgentMcpRepository,
@@ -17,17 +18,27 @@
     AgentSkillRepository,
     AgentWorkSessionRepository,
 )
-from ..services.archive import ArchiveService
-from ..services.agent import ExecuteService, McpService, MemoryService, PlanService, SessionService, SettingsService, SkillService
-from ..services.admin.users import AdminUsersService
-from ..services.admin.storage import AdminStorageService
+from ..s3 import MinioObjectStorageClient
 from ..services.admin.files import AdminFilesService
-from ..services.admin.moderation import AdminModerationService
 from ..services.admin.logs import AdminLogsService
+from ..services.admin.moderation import AdminModerationService
 from ..services.admin.notifications import AdminNotificationsService
+from ..services.admin.storage import AdminStorageService
 from ..services.admin.system import AdminSystemService
+from ..services.admin.users import AdminUsersService
+from ..services.agent import (
+    ExecuteService,
+    McpService,
+    MemoryService,
+    PlanService,
+    SessionService,
+    SettingsService,
+    SkillService,
+)
+from ..services.archive import ArchiveService
 from ..services.auth import AuthService
 from ..services.background_jobs import BackgroundJobService
+from ..services.download_rate_limit import DownloadRateLimitService
 from ..services.email_delivery import VerificationEmailDeliveryService
 from ..services.file import FileService
 from ..services.folder import FolderService
@@ -37,7 +48,6 @@
 from ..services.registration_email_domain_rule import RegistrationEmailDomainRuleService
 from ..services.share import ShareService
 from ..services.upload import UploadService
-from ..s3 import MinioObjectStorageClient
 from .errors import ApiError
 from .security import decode_access_token
 from .settings import Settings, get_settings
@@ -55,6 +65,7 @@
     redis_url=_settings.redis_url,
     stream_key=_settings.agent_queue_stream,
 )
+_agent_event_bus_singleton: AgentEventBus | None = None
 
 
 def get_rate_limiter() -> RedisRateLimiter:
@@ -77,6 +88,17 @@ def get_agent_job_queue_publisher() -> RedisStreamJobQueue:
     return _agent_job_queue_publisher
 
 
+def get_agent_event_bus() -> AgentEventBus:
+    """Return the shared agent event bus, building it on first use."""
+    global _agent_event_bus_singleton
+    bus = _agent_event_bus_singleton
+    if bus is None:
+        # First call: build from the module settings and cache for later calls.
+        bus = build_agent_event_bus(settings=_settings)
+        _agent_event_bus_singleton = bus
+    return bus
+
+
 def get_background_job_service(
     queue_publisher: RedisStreamJobQueue = Depends(get_job_queue_publisher),
 ) -> BackgroundJobService:
@@ -93,6 +111,19 @@ def get_settings_dep() -> Settings:
     return _settings
 
 
+def get_download_rate_limit_service(
+    db: AsyncSession = Depends(get_db),
+    settings: Settings = Depends(get_settings_dep),
+    rate_limiter: RedisRateLimiter = Depends(get_rate_limiter),
+) -> DownloadRateLimitService:
+    """FastAPI dependency that wires up a ``DownloadRateLimitService``."""
+    return DownloadRateLimitService(
+        db=db,
+        settings=settings,
+        rate_limiter=rate_limiter,
+    )
+
+
 def get_client_ip(request: Request) -> str:
     forwarded_for = request.headers.get("x-forwarded-for")
     if forwarded_for:
diff --git a/app/src/fileflash/core/settings.py b/app/src/fileflash/core/settings.py
index 80316a2..71dde62 100644
--- a/app/src/fileflash/core/settings.py
+++ b/app/src/fileflash/core/settings.py
@@ -56,6 +56,22 @@ class Settings(BaseSettings):
     cors_origins: list[str] = Field(default_factory=lambda: ["http://localhost:5173", "http://localhost:8080"])
 
     redis_url: str | None = Field(default=None, alias="REDIS_URL")
+    agent_inbox_ask_timeout_sec: int = Field(
+        default=1800,
+        alias="AGENT_INBOX_ASK_TIMEOUT_SEC",
+    )
+    agent_event_channel_prefix: str = Field(
+        default="agent:job",
+        alias="AGENT_EVENT_CHANNEL_PREFIX",
+    )
+    agent_inbox_channel_prefix: str = Field(
+        default="agent:inbox",
+        alias="AGENT_INBOX_CHANNEL_PREFIX",
+    )
+    agent_event_bus_buffer_size: int = Field(
+        default=64,
+        alias="AGENT_EVENT_BUS_BUFFER_SIZE",
+    )
     rabbitmq_url: str | None = Field(default=None, alias="RABBITMQ_URL")
 
     email_verify_base_url: str = Field(default="", alias="EMAIL_VERIFY_BASE_URL")
@@ -95,19 +111,25 @@ class Settings(BaseSettings):
     upload_temp_prefix: str = Field(default="tmp", alias="UPLOAD_TEMP_PREFIX")
     upload_object_prefix: str = Field(default="objects", alias="UPLOAD_OBJECT_PREFIX")
 
-    max_failed_login_attempts: int = 5
-    account_lock_minutes: int = 15
+    max_failed_login_attempts: int = 8
+    account_lock_minutes: int = 5
     email_verification_expire_minutes: int = 60
     password_reset_expire_minutes: int = 30
 
-    register_rate_limit: int = 5
+    register_rate_limit: int = 12
     register_rate_window_seconds: int = 600
-    login_rate_limit: int = 10
+    login_rate_limit: int = 30
     login_rate_window_seconds: int = 300
     forgot_password_rate_limit: int = 5
     forgot_password_rate_window_seconds: int = 600
     resend_verification_rate_limit: int = 5
     resend_verification_rate_window_seconds: int = 600
+    download_rate_window_seconds: int = Field(default=600, alias="DOWNLOAD_RATE_WINDOW_SECONDS")
+    download_rate_limit_requests: int = Field(default=120, alias="DOWNLOAD_RATE_LIMIT_REQUESTS")
+    download_rate_limit_bytes: int = Field(
+        default=2 * 1024 * 1024 * 1024,
+        alias="DOWNLOAD_RATE_LIMIT_BYTES",
+    )
 
     worker_poll_interval_seconds: float = Field(
         default=2.0,
@@ -145,6 +167,7 @@ class Settings(BaseSettings):
     agent_llm_model: str = Field(default="claude-sonnet-4-6", alias="AGENT_LLM_MODEL")
     agent_llm_base_url: str | None = Field(default=None, alias="AGENT_LLM_BASE_URL")
     agent_llm_api_key: str | None = Field(default=None, alias="AGENT_LLM_API_KEY")
+    agent_llm_plan_max_tokens: int = Field(default=8192, alias="AGENT_LLM_PLAN_MAX_TOKENS")
     agent_mcp_endpoints_raw: str = Field(default="[]", alias="AGENT_MCP_ENDPOINTS")
 
     ffmpeg_binary: str = Field(default="ffmpeg", alias="FFMPEG_BINARY")
diff --git a/app/src/fileflash/models/__init__.py b/app/src/fileflash/models/__init__.py
index 575fa97..21cd3a5 100644
--- a/app/src/fileflash/models/__init__.py
+++ b/app/src/fileflash/models/__init__.py
@@ -2,6 +2,7 @@
 from .tables import (
     Acl,
     AgentActionLog,
+    AgentInboxMessage,
     AgentMcpServer,
     AgentMemory,
     AgentPlan,
@@ -40,6 +41,7 @@
 __all__ = [
     "Acl",
     "AgentActionLog",
+    "AgentInboxMessage",
     "AgentMcpServer",
     "AgentMemory",
     "AgentPlan",
diff --git a/app/src/fileflash/models/enums.py b/app/src/fileflash/models/enums.py
index 0ce1e32..7228c78 100644
--- a/app/src/fileflash/models/enums.py
+++ b/app/src/fileflash/models/enums.py
@@ -147,6 +147,36 @@ class AgentMcpVisibility(BaseStrEnum):
     PRIVATE = "private"
 
 
+class AgentInboxRole(BaseStrEnum):
+    """Which side authored an inbox message."""
+
+    AGENT = "agent"
+    USER = "user"
+
+
+class AgentInboxKind(BaseStrEnum):
+    """Kind of an inbox message: a question, its reply, or a control command."""
+
+    ASK = "ask"
+    REPLY = "reply"
+    # Control commands; their values share the "control." prefix.
+    CONTROL_PAUSE = "control.pause"
+    CONTROL_RESUME = "control.resume"
+    CONTROL_APPROVE = "control.approve"
+    CONTROL_DENY = "control.deny"
+    CONTROL_SKIP = "control.skip"
+    CONTROL_CANCEL = "control.cancel"
+
+
+class AgentInboxStatus(BaseStrEnum):
+    """Status values an inbox message can carry."""
+
+    WAITING = "waiting"
+    ANSWERED = "answered"
+    TIMED_OUT = "timed_out"
+    DROPPED = "dropped"
+
+
 __all__ = [
 	"BaseStrEnum",
 	"UploadStatus",
@@ -172,5 +195,8 @@ class AgentMcpVisibility(BaseStrEnum):
     "AgentMemoryKind",
     "AgentSkillVisibility",
     "AgentMcpVisibility",
+    "AgentInboxRole",
+    "AgentInboxKind",
+    "AgentInboxStatus",
 ]
 
diff --git a/app/src/fileflash/models/tables.py b/app/src/fileflash/models/tables.py
index 0040f7b..5f4930c 100644
--- a/app/src/fileflash/models/tables.py
+++ b/app/src/fileflash/models/tables.py
@@ -11,6 +11,7 @@
 )
 from .tables_agent import (
     AgentActionLog,
+    AgentInboxMessage,
     AgentMcpServer,
     AgentMemory,
     AgentPlan,
@@ -50,6 +51,7 @@
 __all__ = [
     "Acl",
     "AgentActionLog",
+    "AgentInboxMessage",
     "AgentMcpServer",
     "AgentMemory",
     "AgentPlan",
diff --git a/app/src/fileflash/models/tables_agent.py b/app/src/fileflash/models/tables_agent.py
index 33b4e79..3ad9591 100644
--- a/app/src/fileflash/models/tables_agent.py
+++ b/app/src/fileflash/models/tables_agent.py
@@ -21,6 +21,9 @@
 from .base import Base
 from .enums import (
     AgentExecutionPolicy,
+    AgentInboxKind,
+    AgentInboxRole,
+    AgentInboxStatus,
     AgentMcpVisibility,
     AgentMemoryKind,
     AgentMemoryScope,
@@ -345,8 +348,68 @@ class AgentWorkSession(Base):
     closed_at: Mapped[datetime | None] = mapped_column(DateTime)
 
 
+class AgentInboxMessage(Base):
+    """ORM mapping for the ``agent_inbox_message`` table.
+
+    Each row belongs to one background job and carries a role, a kind, a JSONB
+    payload, an optional reference to another inbox row and an optional status.
+    """
+
+    __tablename__ = "agent_inbox_message"
+    __table_args__ = (
+        Index("idx_agent_inbox_message_job_created", "job_id", "created_at"),
+        # Partial index: rows with a NULL status are not included.
+        Index(
+            "idx_agent_inbox_message_job_status",
+            "job_id",
+            "status",
+            postgresql_where=text("status IS NOT NULL"),
+        ),
+    )
+
+    inbox_message_id: Mapped[int] = mapped_column(BigInteger, Identity(), primary_key=True)
+    # Inbox rows are removed together with their background job (ON DELETE CASCADE).
+    job_id: Mapped[int] = mapped_column(
+        BigInteger,
+        ForeignKey("background_job.job_id", ondelete="CASCADE"),
+        nullable=False,
+    )
+    role: Mapped[AgentInboxRole] = mapped_column(
+        pg_enum(AgentInboxRole, "agent_inbox_role_enum"),
+        nullable=False,
+    )
+    kind: Mapped[AgentInboxKind] = mapped_column(
+        pg_enum(AgentInboxKind, "agent_inbox_kind_enum"),
+        nullable=False,
+    )
+    # Database-side default is an empty JSON object.
+    payload_json: Mapped[dict[str, Any]] = mapped_column(
+        JSONB,
+        nullable=False,
+        server_default=text("'{}'::jsonb"),
+    )
+    # Self-referencing link; set to NULL if the referenced row is deleted.
+    reply_to_id: Mapped[int | None] = mapped_column(
+        BigInteger,
+        ForeignKey("agent_inbox_message.inbox_message_id", ondelete="SET NULL"),
+    )
+    # Nullable in this mapping: a row may have no status.
+    status: Mapped[AgentInboxStatus | None] = mapped_column(
+        pg_enum(AgentInboxStatus, "agent_inbox_status_enum"),
+    )
+    # NOTE(review): DateTime is used without timezone=True here — confirm that
+    # timezone-aware values written by callers are handled as intended.
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime,
+        nullable=False,
+        server_default=text("CURRENT_TIMESTAMP"),
+    )
+    answered_at: Mapped[datetime | None] = mapped_column(DateTime)
+
+
 __all__ = [
     "AgentActionLog",
+    "AgentInboxMessage",
     "AgentMcpServer",
     "AgentMemory",
     "AgentPlan",
diff --git a/app/src/fileflash/repositories/__init__.py b/app/src/fileflash/repositories/__init__.py
index 84b1407..c063ea1 100644
--- a/app/src/fileflash/repositories/__init__.py
+++ b/app/src/fileflash/repositories/__init__.py
@@ -1,5 +1,6 @@
 from .agent import (
     AgentActionLogRepository,
+    AgentInboxMessageRepository,
     AgentMcpCatalogEntry,
     AgentMcpRepository,
     AgentMemoryActiveEntry,
@@ -13,6 +14,7 @@
 
 __all__ = [
     "AgentActionLogRepository",
+    "AgentInboxMessageRepository",
     "AgentMcpCatalogEntry",
     "AgentMcpRepository",
     "AgentMemoryActiveEntry",
diff --git a/app/src/fileflash/repositories/agent/__init__.py b/app/src/fileflash/repositories/agent/__init__.py
index ac9837d..c551d06 100644
--- a/app/src/fileflash/repositories/agent/__init__.py
+++ b/app/src/fileflash/repositories/agent/__init__.py
@@ -1,5 +1,6 @@
 from .action_log import AgentActionLogRepository
 from .contracts import AgentMcpCatalogEntry, AgentMemoryActiveEntry, AgentSkillCatalogEntry
+from .inbox import AgentInboxMessageRepository
 from .mcp import AgentMcpRepository
 from .memory import AgentMemoryRepository
 from .plan import AgentPlanRepository
@@ -9,6 +10,7 @@
 
 __all__ = [
     "AgentActionLogRepository",
+    "AgentInboxMessageRepository",
     "AgentMcpCatalogEntry",
     "AgentMcpRepository",
     "AgentMemoryActiveEntry",
diff --git a/app/src/fileflash/repositories/agent/inbox.py b/app/src/fileflash/repositories/agent/inbox.py
new file mode 100644
index 0000000..d6996b2
--- /dev/null
+++ b/app/src/fileflash/repositories/agent/inbox.py
@@ -0,0 +1,177 @@
+from __future__ import annotations
+
+from datetime import UTC, datetime
+from typing import Any
+
+from sqlalchemy import and_, select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ...models import AgentInboxMessage
+from ...models.enums import AgentInboxKind, AgentInboxRole, AgentInboxStatus
+
+# Control kinds a user can send; ``ask`` and ``reply`` are not part of this set.
+_CONTROL_KINDS = frozenset(
+    {
+        AgentInboxKind.CONTROL_PAUSE,
+        AgentInboxKind.CONTROL_RESUME,
+        AgentInboxKind.CONTROL_APPROVE,
+        AgentInboxKind.CONTROL_DENY,
+        AgentInboxKind.CONTROL_SKIP,
+        AgentInboxKind.CONTROL_CANCEL,
+    }
+)
+
+
+class AgentInboxMessageRepository:
+    """Data-access helpers for ``AgentInboxMessage`` rows.
+
+    Writes are flushed to the session but never committed here.
+    """
+
+    def __init__(self, db: AsyncSession) -> None:
+        self._db = db
+
+    async def create_ask(
+        self,
+        *,
+        job_id: int,
+        payload: dict[str, Any],
+    ) -> AgentInboxMessage:
+        """Insert an agent-authored ``ask`` row in ``waiting`` status."""
+        msg = AgentInboxMessage(
+            job_id=job_id,
+            role=AgentInboxRole.AGENT,
+            kind=AgentInboxKind.ASK,
+            payload_json=payload,
+            status=AgentInboxStatus.WAITING,
+            created_at=datetime.now(UTC),
+        )
+        self._db.add(msg)
+        await self._db.flush()
+        return msg
+
+    async def record_user_message(
+        self,
+        *,
+        job_id: int,
+        kind: AgentInboxKind,
+        payload: dict[str, Any],
+        reply_to_id: int | None = None,
+    ) -> AgentInboxMessage:
+        """Insert a user-authored row of ``kind`` with no status set."""
+        msg = AgentInboxMessage(
+            job_id=job_id,
+            role=AgentInboxRole.USER,
+            kind=kind,
+            payload_json=payload,
+            reply_to_id=reply_to_id,
+            status=None,
+            created_at=datetime.now(UTC),
+        )
+        self._db.add(msg)
+        await self._db.flush()
+        return msg
+
+    async def mark_answered(
+        self,
+        *,
+        inbox_message_id: int,
+        answered_at: datetime,
+    ) -> AgentInboxMessage:
+        """Set the row to ``answered``; raise ``ValueError`` if it is missing."""
+        return await self._finish(
+            inbox_message_id=inbox_message_id,
+            status=AgentInboxStatus.ANSWERED,
+            answered_at=answered_at,
+        )
+
+    async def mark_timed_out(
+        self,
+        *,
+        inbox_message_id: int,
+        answered_at: datetime,
+    ) -> AgentInboxMessage:
+        """Set the row to ``timed_out``; raise ``ValueError`` if it is missing."""
+        return await self._finish(
+            inbox_message_id=inbox_message_id,
+            status=AgentInboxStatus.TIMED_OUT,
+            answered_at=answered_at,
+        )
+
+    async def _finish(
+        self,
+        *,
+        inbox_message_id: int,
+        status: AgentInboxStatus,
+        answered_at: datetime,
+    ) -> AgentInboxMessage:
+        """Store ``status`` and ``answered_at`` on one row and flush."""
+        msg = await self._db.get(AgentInboxMessage, inbox_message_id)
+        if msg is None:
+            raise ValueError(f"AgentInboxMessage {inbox_message_id} not found")
+        msg.status = status
+        msg.answered_at = answered_at
+        await self._db.flush()
+        return msg
+
+    async def mark_dropped(self, *, inbox_message_id: int) -> None:
+        """Mark a control message as ``dropped``; other kinds are left untouched.
+
+        A missing row is ignored silently.
+        """
+        msg = await self._db.get(AgentInboxMessage, inbox_message_id)
+        if msg is None:
+            return
+        if msg.kind in _CONTROL_KINDS:
+            msg.status = AgentInboxStatus.DROPPED
+            msg.answered_at = datetime.now(UTC)
+        await self._db.flush()
+
+    async def get_ask(self, *, inbox_message_id: int) -> AgentInboxMessage | None:
+        """Return the row only if it exists and is an ``ask``; else ``None``."""
+        msg = await self._db.get(AgentInboxMessage, inbox_message_id)
+        if msg is None or msg.kind != AgentInboxKind.ASK:
+            return None
+        return msg
+
+    async def get_reply_for(self, *, ask_id: int) -> AgentInboxMessage | None:
+        """Return the earliest ``reply`` pointing at ``ask_id``, or ``None``."""
+        # Explicit ordering + LIMIT 1: with several replies the chosen row must
+        # not depend on the database's scan order.
+        return await self._db.scalar(
+            select(AgentInboxMessage)
+            .where(
+                and_(
+                    AgentInboxMessage.reply_to_id == ask_id,
+                    AgentInboxMessage.kind == AgentInboxKind.REPLY,
+                )
+            )
+            .order_by(
+                AgentInboxMessage.created_at.asc(),
+                AgentInboxMessage.inbox_message_id.asc(),
+            )
+            .limit(1)
+        )
+
+    async def list_pending_controls(self, *, job_id: int) -> list[AgentInboxMessage]:
+        """List the job's user control messages that have no status, oldest first."""
+        rows = await self._db.scalars(
+            select(AgentInboxMessage)
+            .where(
+                and_(
+                    AgentInboxMessage.job_id == job_id,
+                    AgentInboxMessage.role == AgentInboxRole.USER,
+                    AgentInboxMessage.kind.in_(list(_CONTROL_KINDS)),
+                    AgentInboxMessage.status.is_(None),
+                )
+            )
+            .order_by(
+                AgentInboxMessage.created_at.asc(),
+                # Tie-breaker so rows sharing a timestamp come back in a stable order.
+                AgentInboxMessage.inbox_message_id.asc(),
+            )
+        )
+        return list(rows)
+
+
+__all__ = ["AgentInboxMessageRepository"]
diff --git a/app/src/fileflash/routers/admin_users.py b/app/src/fileflash/routers/admin_users.py
index 09278c0..0eb8619 100644
--- a/app/src/fileflash/routers/admin_users.py
+++ b/app/src/fileflash/routers/admin_users.py
@@ -11,9 +11,25 @@
 router = APIRouter(prefix="/admin/users", tags=["admin"])
 
 
+def get_list_admin_users_query(query: ListAdminUsersQuery = Depends()) -> ListAdminUsersQuery:
+    """Dependency that validates the admin user-list query before the handler runs.
+
+    Calls ``query.resolve_usage_window()`` and converts a ``ValueError`` into a
+    400 ``ApiError`` carrying the same message; otherwise returns ``query``.
+    """
+    try:
+        query.resolve_usage_window()
+    except ValueError as exc:
+        from ..core.errors import ApiError
+
+        raise ApiError(status_code=400, code=400, message=str(exc)) from exc
+    else:
+        return query
+
+
 @router.get("")
 async def list_admin_users(
-    query: ListAdminUsersQuery = Depends(),
+    query: ListAdminUsersQuery = Depends(get_list_admin_users_query),
     _: User = Depends(require_admin),
     service: AdminUsersService = Depends(get_admin_users_service),
 ):
diff --git a/app/src/fileflash/routers/agent.py b/app/src/fileflash/routers/agent.py
index 2e56108..4cc869f 100644
--- a/app/src/fileflash/routers/agent.py
+++ b/app/src/fileflash/routers/agent.py
@@ -1,18 +1,34 @@
 from __future__ import annotations
 
-from datetime import UTC, datetime
-from typing import Annotated
+import json
+from typing import Annotated, Any, get_args
 
 from fastapi import APIRouter, Depends
+from fastapi.responses import StreamingResponse
 from sqlalchemy import and_, select
 from sqlalchemy.ext.asyncio import AsyncSession
 
-from ..core.deps import get_agent_execute_service, get_agent_plan_service, get_current_user
+from ..agents.harness.event_bus import AgentEventBus, AgentEventEnvelope
+from ..agents.harness.inbox import AgentInbox
+from ..core.deps import (
+    get_agent_event_bus,
+    get_agent_execute_service,
+    get_agent_plan_service,
+    get_current_user,
+)
 from ..core.errors import ApiError, api_success
 from ..db.deps import get_db
-from ..models import BackgroundJob
+from ..models import AgentActionLog, BackgroundJob
+from ..models.enums import AgentInboxKind
 from ..models.tables_identity import User
-from ..schemas.agent import CancelAgentResponse, ExecuteAgentRequest, PlanAgentRequest
+from ..schemas.agent import (
+    AgentInboxMessageRequest,
+    AgentInboxMessageResponse,
+    AgentJobEvent,
+    AgentJobEventType,
+    ExecuteAgentRequest,
+    PlanAgentRequest,
+)
 from ..services.agent import ExecuteService, PlanService
 
 router = APIRouter(prefix="/agent", tags=["agent"])
@@ -44,16 +60,73 @@ async def execute_agent_plan(
     )
 
 
-@router.post("/cancel/{job_id}")
-async def cancel_agent_job(
+@router.get("/jobs/{job_id}/events")
+async def stream_agent_job_events(
     job_id: str,
     current_user: Annotated[User, Depends(get_current_user)],
     db: Annotated[AsyncSession, Depends(get_db)],
+    event_bus: Annotated[AgentEventBus, Depends(get_agent_event_bus)],
 ):
-    try:
-        parsed_job_id = int(job_id)
-    except ValueError as exc:
-        raise ApiError(status_code=400, code=400, message="Invalid jobId") from exc
+    """Stream a job's events to the requesting user as Server-Sent Events.
+
+    A snapshot of events derived from the database is sent first. If the job
+    is not yet terminal, live envelopes from the event bus follow until a
+    terminal ``job.*`` event has been forwarded.
+    """
+    parsed_job_id = _parse_job_id(job_id)
+    initial_events, initial_terminal = await _agent_job_events_for_job(
+        db=db,
+        job_id=parsed_job_id,
+        user_id=int(current_user.user_id),
+    )
+
+    async def event_stream():
+        # Ids already sent; used to skip live events that repeat the snapshot.
+        seen: set[str] = set()
+        for event in initial_events:
+            seen.add(event.id)
+            yield _format_sse_event(event)
+        if initial_terminal:
+            return
+        # NOTE(review): the subscription starts after the snapshot was read, so
+        # events published in between are missed unless the bus replays — confirm.
+        async with event_bus.subscribe(job_id=parsed_job_id) as stream:
+            while True:
+                try:
+                    envelope = await stream.next(timeout=30.0)
+                except TimeoutError:
+                    # No event within 30 s: emit an SSE comment line as keep-alive.
+                    yield ": keep-alive\n\n"
+                    continue
+                event = _envelope_to_job_event(envelope)
+                if event is None:
+                    continue
+                if event.id in seen:
+                    continue
+                seen.add(event.id)
+                yield _format_sse_event(event)
+                if event.type in {"job.succeeded", "job.failed", "job.canceled"}:
+                    break
+
+    return StreamingResponse(
+        event_stream(),
+        media_type="text/event-stream",
+        headers={
+            "Cache-Control": "no-cache",
+            "X-Accel-Buffering": "no",
+        },
+    )
+
+
+@router.post("/jobs/{job_id}/messages")
+async def post_agent_job_message(
+    job_id: str,
+    payload: AgentInboxMessageRequest,
+    current_user: Annotated[User, Depends(get_current_user)],
+    db: Annotated[AsyncSession, Depends(get_db)],
+    event_bus: Annotated[AgentEventBus, Depends(get_agent_event_bus)],
+):
+    parsed_job_id = _parse_job_id(job_id)
     job = await db.scalar(
         select(BackgroundJob)
         .where(
@@ -63,27 +126,260 @@ async def cancel_agent_job(
                 BackgroundJob.task_type.in_(["agent.plan", "agent.execute"]),
             )
         )
-        .with_for_update()
     )
     if job is None:
         raise ApiError(status_code=404, code=404, message="Job not found")
 
-    canceled_at = datetime.now(UTC)
-    if job.status not in {"succeeded", "failed", "canceled"}:
-        job.cancel_requested_at = canceled_at
-        job.status = "canceled"
-        job.agent_phase = "canceled"
-        job.finished_at = canceled_at
-        job.updated_at = canceled_at
+    kind = AgentInboxKind(payload.kind)
+    reply_to_id: int | None = None
+    if payload.reply_to is not None:
+        try:
+            reply_to_id = int(payload.reply_to)
+        except ValueError as exc:
+            raise ApiError(status_code=400, code=400, message="Invalid replyTo") from exc
+
+    inbox = AgentInbox(db=db, event_bus=event_bus)
+    try:
+        msg = await inbox.handle(
+            job_id=parsed_job_id,
+            kind=kind,
+            payload=_inbox_payload_from_request(payload),
+            reply_to_id=reply_to_id,
+        )
+    except ValueError as exc:
+        raise ApiError(status_code=400, code=400, message=str(exc)) from exc
     await db.commit()
-    await db.refresh(job)
 
-    data = CancelAgentResponse(
+    data = AgentInboxMessageResponse(
+        inbox_message_id=str(msg.inbox_message_id),
+        kind=payload.kind,
+        accepted_at=msg.created_at,
+    )
+    return api_success(data=data.model_dump(by_alias=True), message="Message accepted")
+
+
+def _inbox_payload_from_request(req: AgentInboxMessageRequest) -> dict[str, Any]:
+    """Collect the optional ``value``/``metadata`` request fields into a payload dict."""
+    # ``value`` is kept unless it is None; ``metadata`` only when it is truthy.
+    value_part = {} if req.value is None else {"value": req.value}
+    metadata_part = {"metadata": req.metadata} if req.metadata else {}
+    # Merging in this order keeps "value" ahead of "metadata".
+    return {**value_part, **metadata_part}
+
+
+def _parse_job_id(raw: str) -> int:  # path job id -> positive int, else a 400 ApiError
+    try:
+        parsed_job_id = int(raw)
+    except ValueError as exc:  # ``raw`` is not an integer literal
+        raise ApiError(status_code=400, code=400, message="Invalid jobId") from exc
+    if parsed_job_id <= 0:  # zero and negative ids are rejected with the same message
+        raise ApiError(status_code=400, code=400, message="Invalid jobId")
+    return parsed_job_id
+
+
+async def _agent_job_events_for_job(  # snapshot of a job's events rebuilt from database rows
+    *,
+    db: AsyncSession,
+    job_id: int,
+    user_id: int,
+) -> tuple[list[AgentJobEvent], bool]:  # (events, whether the job is already terminal)
+    job = await db.scalar(
+        select(BackgroundJob).where(
+            and_(
+                BackgroundJob.job_id == job_id,
+                BackgroundJob.requested_by == user_id,  # only jobs requested by this user match
+                BackgroundJob.task_type.in_(["agent.plan", "agent.execute"]),
+            )
+        )
+    )
+    if job is None:
+        raise ApiError(status_code=404, code=404, message="Job not found")  # also raised for other users' jobs
+
+    terminal = str(job.status) in {"succeeded", "failed", "canceled"}
+    events: list[AgentJobEvent] = []
+    if job.task_type == "agent.plan" and job.status == "succeeded" and job.result:
+        events.append(_plan_ready_event(job))  # plan.ready goes before the status event
+        events.append(_job_status_event(job))
+    elif job.task_type != "agent.execute" or not terminal:
+        events.append(_job_status_event(job))  # terminal execute jobs get their status event last (below)
+
+    if job.task_type == "agent.execute":
+        action_logs = list(
+            await db.scalars(
+                select(AgentActionLog)
+                .where(AgentActionLog.job_id == job_id)
+                .order_by(AgentActionLog.step_no.asc())
+            )
+        )
+        for action_log in action_logs:
+            events.extend(_tool_events(job=job, action_log=action_log))
+        if terminal:
+            events.append(_job_status_event(job))  # terminal status comes after all tool events
+
+    return events, terminal
+
+
+def _job_status_event(job: BackgroundJob) -> AgentJobEvent:  # status event for the job's current state
+    status = str(job.status)
+    event_type = {
+        "pending": "job.queued",
+        "running": "job.running",
+        "succeeded": "job.succeeded",
+        "failed": "job.failed",
+        "canceled": "job.canceled",
+    }.get(status, "job.running")  # any other status is reported as job.running
+    timestamp = job.updated_at or job.created_at  # falls back to created_at when updated_at is unset
+    return AgentJobEvent(
+        id=f"{job.job_id}:job:{status}:{timestamp.isoformat()}",  # id changes with status and timestamp
         job_id=str(job.job_id),
+        task_type=str(job.task_type),
+        type=event_type,  # type: ignore[arg-type]
+        status=status,
+        agent_phase=job.agent_phase,
+        message=_job_status_message(job),
+        data=_job_status_data(job),
+        timestamp=timestamp,
+    )
+
+
+def _plan_ready_event(job: BackgroundJob) -> AgentJobEvent:  # plan.ready event carrying the stored job result
+    timestamp = job.finished_at or job.updated_at or job.created_at  # first timestamp that is set
+    return AgentJobEvent(
+        id=f"{job.job_id}:plan-ready",  # fixed id per job
+        job_id=str(job.job_id),
+        task_type=str(job.task_type),
+        type="plan.ready",
         status=str(job.status),
-        canceled_at=job.cancel_requested_at or canceled_at,
+        agent_phase=job.agent_phase,
+        message="计划已生成。",  # "Plan generated."
+        data={"result": dict(job.result or {})},  # copy of the result, {} when it is empty
+        timestamp=timestamp,
+    )
+
+
+def _tool_events(*, job: BackgroundJob, action_log: AgentActionLog) -> list[AgentJobEvent]:  # Expand one action log into its events.
+    events = [  # a "tool.started" event is always emitted
+        AgentJobEvent(
+            id=f"{job.job_id}:tool:{action_log.action_log_id}:started",
+            job_id=str(job.job_id),
+            task_type=str(job.task_type),
+            type="tool.started",
+            status=str(job.status),
+            agent_phase=job.agent_phase,
+            message=_tool_started_message(action_log),
+            data=_tool_event_data(action_log, include_output=False),  # inputs only; output goes on the finish event
+            timestamp=action_log.started_at,
+        )
+    ]
+    if action_log.status in {"succeeded", "failed"} and action_log.finished_at is not None:  # finished calls only
+        events.append(
+            AgentJobEvent(
+                id=f"{job.job_id}:tool:{action_log.action_log_id}:{action_log.status}",
+                job_id=str(job.job_id),
+                task_type=str(job.task_type),
+                type="tool.succeeded" if action_log.status == "succeeded" else "tool.failed",
+                status=str(job.status),
+                agent_phase=job.agent_phase,
+                message=_tool_finished_message(action_log),
+                data=_tool_event_data(action_log, include_output=True),
+                timestamp=action_log.finished_at,
+            )
+        )
+    return events
+
+
+def _job_status_message(job: BackgroundJob) -> str:  # Return the display message for the job's current status.
+    status = str(job.status)
+    if status == "pending":
+        return "任务已排队。"
+    if status == "running":  # "agent.plan" jobs get the planning text, every other task type the executing text
+        return "正在规划任务。" if job.task_type == "agent.plan" else "正在执行计划。"
+    if status == "succeeded":
+        result = dict(job.result or {})
+        answer = result.get("answer")
+        if isinstance(answer, str) and answer.strip():  # a non-blank string answer selects the answer text
+            return "答案已生成。"
+        return "任务已完成。"
+    if status == "failed":
+        return str(job.error_message or "任务失败。")  # the stored error message wins over the generic text
+    if status == "canceled":
+        return "任务已取消。"
+    return "任务状态已更新。"  # fallback for any other status
+
+
+def _job_status_data(job: BackgroundJob) -> dict[str, object]:  # Collect the data payload for a job status event.
+    data: dict[str, object] = {}
+    if job.status in {"succeeded", "failed", "canceled"}:  # the result is attached only for these three statuses
+        data["result"] = dict(job.result or {})
+    if job.error_message:  # attached whenever set, regardless of status
+        data["errorMessage"] = job.error_message
+    return data
+
+
+def _tool_started_message(action_log: AgentActionLog) -> str:  # Return the display message for a tool call that has started.
+    if action_log.tool_name == "drive.countFiles":  # this tool gets wording derived from its search/category inputs
+        inputs = dict(action_log.inputs_json or {})
+        search = str(inputs.get("search") or "").strip()
+        category = str(inputs.get("category") or "").strip()
+        target = "视频文件" if category == "video" else "文件"
+        if search:  # mention the search term only when one was given
+            return f"正在读取名称包含“{search}”的{target}数量。"
+        return f"正在读取{target}数量。"
+    return f"正在调用 {action_log.tool_name}。"  # generic message for every other tool
+
+
+def _tool_finished_message(action_log: AgentActionLog) -> str:  # Return the display message for a finished tool call.
+    if action_log.status == "failed":
+        return str(action_log.error_message or f"{action_log.tool_name} 调用失败。")  # stored error text wins
+    if action_log.tool_name == "drive.countFiles":
+        outputs = dict(action_log.outputs_json or {})
+        total_items = int(outputs.get("totalItems") or 0)  # a missing or falsy totalItems counts as 0
+        return f"读取完成，匹配 {total_items} 个文件。"
+    return f"{action_log.tool_name} 已完成。"  # generic message for every other tool
+
+
+def _tool_event_data(action_log: AgentActionLog, *, include_output: bool) -> dict[str, object]:  # Build a tool event's data payload.
+    data: dict[str, object] = {
+        "step": int(action_log.step_no),
+        "tool": str(action_log.tool_name),
+        "input": dict(action_log.inputs_json or {}),  # empty dict when no inputs were recorded
+    }
+    if include_output:
+        data["output"] = dict(action_log.outputs_json or {})
+        if action_log.duration_ms is not None:  # duration is reported only together with the output
+            data["durationMs"] = int(action_log.duration_ms)
+    if action_log.error_message:  # added whether or not the output is included
+        data["errorMessage"] = action_log.error_message
+    return data
+
+
+def _envelope_to_job_event(env: AgentEventEnvelope) -> AgentJobEvent | None:  # Map an envelope to a job event, or None to drop it.
+    if env.event_type.startswith("agent.inbox."):  # inbox envelopes are never turned into job events
+        return None
+    if env.event_type not in get_args(AgentJobEventType):  # drop event types outside the AgentJobEventType literals
+        return None
+    payload = dict(env.payload or {})
+    data = payload.get("data")
+    return AgentJobEvent(
+        id=env.event_id or f"{env.job_id}:{env.event_type}:{env.emitted_at.isoformat()}",  # synthesized when event_id is empty
+        job_id=str(env.job_id),
+        task_type=str(payload.get("taskType") or "agent.execute"),  # default when the payload has no taskType
+        type=env.event_type,  # type: ignore[arg-type]
+        status=str(payload.get("status") or "running"),  # default when the payload has no status
+        agent_phase=payload.get("agentPhase"),
+        message=str(payload.get("message") or ""),
+        data=dict(data) if isinstance(data, dict) else payload,  # payload["data"] when it is a dict, else the whole payload
+        timestamp=env.emitted_at,
+    )
+
+
+def _format_sse_event(event: AgentJobEvent) -> str:  # Render the event as text with "id:", "event:" and "data:" lines.
+    payload = event.model_dump(by_alias=True, mode="json")  # dumped by alias in JSON mode
+    return (
+        f"id: {event.id}\n"
+        f"event: {event.type}\n"
+        f"data: {json.dumps(payload, ensure_ascii=False, separators=(',', ':'))}\n\n"  # compact JSON; ends with a blank line
     )
-    return api_success(data=data.model_dump(by_alias=True), message="Job canceled")
 
 
 __all__ = ["router"]
diff --git a/app/src/fileflash/routers/files.py b/app/src/fileflash/routers/files.py
index e54c99a..8938b4d 100644
--- a/app/src/fileflash/routers/files.py
+++ b/app/src/fileflash/routers/files.py
@@ -9,7 +9,13 @@
 from jwt import InvalidTokenError
 from starlette.background import BackgroundTask
 
-from ..core.deps import get_archive_service, get_current_user, get_file_service, get_settings_dep
+from ..core.deps import (
+    get_archive_service,
+    get_current_user,
+    get_download_rate_limit_service,
+    get_file_service,
+    get_settings_dep,
+)
 from ..core.errors import ApiError, api_success
 from ..core.security import create_file_preview_token, decode_file_preview_token
 from ..core.settings import Settings
@@ -26,11 +32,19 @@
 )
 from ..schemas.job import to_background_job_response
 from ..services.archive import ArchiveService
+from ..services.download_rate_limit import DownloadRateLimitService
 from ..services.file import FileService
 
 router = APIRouter(prefix="/files", tags=["files"])
 
 
+def _content_length(headers: dict[str, str]) -> int:  # Content-Length as an int >= 0; 0 when absent, empty or not a number
+    try:  # HTTP header names are case-insensitive, so compare lower-cased keys instead of one exact spelling
+        return max(0, int({k.lower(): v for k, v in headers.items()}.get("content-length") or 0))
+    except ValueError:
+        return 0
+
+
 @router.get("")
 async def list_files(
     folder_id: str | None = Query(None, alias="folderId"),
@@ -112,11 +126,14 @@ async def batch_download_files(
     payload: BatchDownloadRequest,
     current_user: User = Depends(get_current_user),
     file_service: FileService = Depends(get_file_service),
+    download_limiter: DownloadRateLimitService = Depends(get_download_rate_limit_service),
 ):
-    archive_path, archive_name = await file_service.create_batch_download_archive(
+    plan = await file_service.create_batch_download_plan(
         user_id=current_user.user_id,
         payload=payload,
     )
+    await download_limiter.enforce_user(user=current_user, bytes_count=plan.estimated_bytes)
+    archive_path, archive_name = await file_service.create_batch_download_archive_from_plan(plan=plan)
     return FileResponse(
         archive_path,
         media_type="application/zip",
@@ -146,12 +163,14 @@ async def download_file(
     range_header: str | None = Header(default=None, alias="Range"),
     current_user: User = Depends(get_current_user),
     file_service: FileService = Depends(get_file_service),
+    download_limiter: DownloadRateLimitService = Depends(get_download_rate_limit_service),
 ):
     result = await file_service.get_download_stream(
         user_id=current_user.user_id,
         file_id=file_id,
         range_header=range_header,
     )
+    await download_limiter.enforce_user(user=current_user, bytes_count=_content_length(result.headers))
     return StreamingResponse(
         result.stream,
         media_type=result.content_type,
@@ -166,12 +185,14 @@ async def preview_file(
     range_header: str | None = Header(default=None, alias="Range"),
     current_user: User = Depends(get_current_user),
     file_service: FileService = Depends(get_file_service),
+    download_limiter: DownloadRateLimitService = Depends(get_download_rate_limit_service),
 ):
     result = await file_service.get_preview_stream(
         user_id=current_user.user_id,
         file_id=file_id,
         range_header=range_header,
     )
+    await download_limiter.enforce_user(user=current_user, bytes_count=_content_length(result.headers))
     return StreamingResponse(
         result.stream,
         media_type=result.content_type,
@@ -216,6 +237,7 @@ async def preview_file_stream(
     range_header: str | None = Header(default=None, alias="Range"),
     file_service: FileService = Depends(get_file_service),
     settings: Settings = Depends(get_settings_dep),
+    download_limiter: DownloadRateLimitService = Depends(get_download_rate_limit_service),
 ):
     try:
         payload = decode_file_preview_token(token, settings)
@@ -232,6 +254,7 @@ async def preview_file_stream(
         file_id=file_id,
         range_header=range_header,
     )
+    await download_limiter.enforce_user_id(user_id=user_id, bytes_count=_content_length(result.headers))
     return StreamingResponse(
         result.stream,
         media_type=result.content_type,
diff --git a/app/src/fileflash/routers/shares.py b/app/src/fileflash/routers/shares.py
index 4341854..4ac18c0 100644
--- a/app/src/fileflash/routers/shares.py
+++ b/app/src/fileflash/routers/shares.py
@@ -3,7 +3,14 @@
 from fastapi import APIRouter, Depends, Header
 from fastapi.responses import StreamingResponse
 
-from ..core.deps import get_client_ip, get_share_service, get_user_agent, get_current_user, require_verified_user
+from ..core.deps import (
+    get_client_ip,
+    get_current_user,
+    get_download_rate_limit_service,
+    get_share_service,
+    get_user_agent,
+    require_verified_user,
+)
 from ..core.errors import api_success
 from ..core.http_headers import build_content_disposition
 from ..models.tables_identity import User
@@ -14,6 +21,7 @@
     SaveShareRequest,
     UpdateShareSettingsRequest,
 )
+from ..services.download_rate_limit import DownloadRateLimitService
 from ..services.share import ShareService
 
 router = APIRouter(prefix="/shares", tags=["shares"])
@@ -85,6 +93,19 @@ def _sanitize_stream_headers(
     return sanitized
 
 
+def _content_length(headers: dict[str, str] | None) -> int:  # Read Content-Length (key matched case-insensitively) as an int >= 0.
+    if not headers:  # None or an empty mapping
+        return 0
+    for key, value in headers.items():
+        if key.lower() != "content-length":
+            continue
+        try:
+            return max(0, int(value))  # negative values are clamped to 0
+        except ValueError:
+            return 0  # the first matching key decides, even when its value does not parse
+    return 0  # header not present
+
+
 @router.post("")
 async def create_share(
     payload: CreateShareRequest,
@@ -195,6 +216,7 @@ async def download_shared_file(
     client_ip: str = Depends(get_client_ip),
     user_agent: str | None = Depends(get_user_agent),
     share_service: ShareService = Depends(get_share_service),
+    download_limiter: DownloadRateLimitService = Depends(get_download_rate_limit_service),
 ):
     token = _extract_bearer_token(authorization)
     if not token:
@@ -210,6 +232,10 @@ async def download_shared_file(
             range_header=range_header,
             ip_address=client_ip,
             user_agent=user_agent,
+            rate_limit_check=lambda bytes_count: download_limiter.enforce_share_ip(
+                client_ip=client_ip,
+                bytes_count=bytes_count,
+            ),
         )
     else:
         raw = await share_service.get_shared_file_stream(
@@ -220,6 +246,8 @@ async def download_shared_file(
             user_agent=user_agent,
         )
     stream, filename, content_type, status_code, headers = _extract_share_stream(tuple(raw))
+    if not hasattr(share_service, "get_shared_file_download_stream_response"):
+        await download_limiter.enforce_share_ip(client_ip=client_ip, bytes_count=_content_length(headers))
     response_headers = _sanitize_stream_headers(headers=headers, filename=filename, disposition="attachment")
     return StreamingResponse(stream, media_type=content_type, headers=response_headers, status_code=status_code)
 
@@ -232,6 +260,7 @@ async def preview_shared_file(
     client_ip: str = Depends(get_client_ip),
     user_agent: str | None = Depends(get_user_agent),
     share_service: ShareService = Depends(get_share_service),
+    download_limiter: DownloadRateLimitService = Depends(get_download_rate_limit_service),
 ):
     token = _extract_bearer_token(authorization)
     if not token:
@@ -247,6 +276,10 @@ async def preview_shared_file(
             range_header=range_header,
             ip_address=client_ip,
             user_agent=user_agent,
+            rate_limit_check=lambda bytes_count: download_limiter.enforce_share_ip(
+                client_ip=client_ip,
+                bytes_count=bytes_count,
+            ),
         )
     else:
         raw = await share_service.get_shared_file_stream(
@@ -257,6 +290,8 @@ async def preview_shared_file(
             user_agent=user_agent,
         )
     stream, filename, content_type, status_code, headers = _extract_share_stream(tuple(raw))
+    if not hasattr(share_service, "get_shared_file_download_stream_response"):
+        await download_limiter.enforce_share_ip(client_ip=client_ip, bytes_count=_content_length(headers))
     response_headers = _sanitize_stream_headers(headers=headers, filename=filename, disposition="inline")
     return StreamingResponse(stream, media_type=content_type, headers=response_headers, status_code=status_code)
 
diff --git a/app/src/fileflash/schemas/__init__.py b/app/src/fileflash/schemas/__init__.py
index c970aae..1e577d9 100644
--- a/app/src/fileflash/schemas/__init__.py
+++ b/app/src/fileflash/schemas/__init__.py
@@ -1,22 +1,10 @@
-from .auth import (
-    ForgotPasswordRequest,
-    ForgotPasswordResponse,
-    LoginRequest,
-    RegisterResponseData,
-    RegisterRequest,
-    ResetPasswordRequest,
-    TokenResponse,
-    VerifyEmailRequest,
-)
-from .agent_skill import (
-    AgentSkillItem,
-    CreateAgentSkillRequest,
-    ImportAgentSkillItem,
-    ImportAgentSkillResult,
-    ImportAgentSkillsRequest,
-    ImportAgentSkillsResponse,
-    ListAgentSkillsQuery,
-    UpdateAgentSkillRequest,
+from .admin.files import (
+    AdminFileAuditDetail,
+    AdminFileAuditItem,
+    AdminFileAuditOwner,
+    AdminFileLatestScan,
+    ListAdminFilesQuery,
+    RescanResponse,
 )
 from .agent import (
     AgentApproval,
@@ -25,7 +13,12 @@
     AgentDataPolicy,
     AgentExecutionResult,
     AgentHints,
+    AgentInboxMessageKind,
+    AgentInboxMessageRequest,
+    AgentInboxMessageResponse,
+    AgentJobEvent,
     AgentPlanContext,
+    AgentPlanningEvidence,
     AgentPlanResult,
     AgentProposedAction,
     AgentReasoningEffort,
@@ -35,20 +28,32 @@
     PlanAgentRequest,
     PlanAgentResponse,
 )
-from .common import ApiResponse, CamelModel, PageQuery, PaginatedData, PaginationMeta
-from .admin.files import (
-    AdminFileAuditDetail,
-    AdminFileAuditItem,
-    AdminFileAuditOwner,
-    AdminFileLatestScan,
-    ListAdminFilesQuery,
-    RescanResponse,
+from .agent_skill import (
+    AgentSkillItem,
+    CreateAgentSkillRequest,
+    ImportAgentSkillItem,
+    ImportAgentSkillResult,
+    ImportAgentSkillsRequest,
+    ImportAgentSkillsResponse,
+    ListAgentSkillsQuery,
+    UpdateAgentSkillRequest,
+)
+from .auth import (
+    ForgotPasswordRequest,
+    ForgotPasswordResponse,
+    LoginRequest,
+    RegisterRequest,
+    RegisterResponseData,
+    ResetPasswordRequest,
+    TokenResponse,
+    VerifyEmailRequest,
 )
+from .common import ApiResponse, CamelModel, PageQuery, PaginatedData, PaginationMeta
 from .file import (
     BatchDownloadRequest,
-    BatchMoveItemResult,
     BatchFilesRequest,
     BatchFilesResponse,
+    BatchMoveItemResult,
     ContentItem,
     CopyFileRequest,
     CopyFileResponse,
@@ -97,12 +102,6 @@
     PermissionItem,
     UpdatePermissionRequest,
 )
-from .registration_email_domain_rule import (
-    CreateRegistrationEmailDomainRuleRequest,
-    ListRegistrationEmailDomainRulesQuery,
-    RegistrationEmailDomainRuleItem,
-    UpdateRegistrationEmailDomainRuleRequest,
-)
 from .recycle import (
     ClearRecycleBinResponse,
     GetRecycleBinQuery,
@@ -111,11 +110,17 @@
     RestoreRecycleItemRequest,
     RestoreRecycleItemResponse,
 )
+from .registration_email_domain_rule import (
+    CreateRegistrationEmailDomainRuleRequest,
+    ListRegistrationEmailDomainRulesQuery,
+    RegistrationEmailDomainRuleItem,
+    UpdateRegistrationEmailDomainRuleRequest,
+)
 from .share import (
+    AcceptSharedItemResponse,
     AccessShareRequest,
     AccessShareResponseData,
     AccessUrls,
-    AcceptSharedItemResponse,
     CreateShareRequest,
     DeleteShareResponse,
     GetSharedItemsQuery,
@@ -178,7 +183,12 @@
     "AgentDataPolicy",
     "AgentExecutionResult",
     "AgentHints",
+    "AgentInboxMessageKind",
+    "AgentInboxMessageRequest",
+    "AgentInboxMessageResponse",
+    "AgentJobEvent",
     "AgentPlanContext",
+    "AgentPlanningEvidence",
     "AgentPlanResult",
     "AgentProposedAction",
     "AgentReasoningEffort",
diff --git a/app/src/fileflash/schemas/admin/users.py b/app/src/fileflash/schemas/admin/users.py
index a62d4f8..9eab779 100644
--- a/app/src/fileflash/schemas/admin/users.py
+++ b/app/src/fileflash/schemas/admin/users.py
@@ -1,12 +1,28 @@
 from __future__ import annotations
 
-from datetime import datetime
+from datetime import UTC, datetime, timedelta
 from typing import Literal
 
+from pydantic import Field
+
 from ..common import CamelModel, PageQuery
 
 ExternalUserStatus = Literal["active", "suspended", "pending_verification"]
 
+DEFAULT_USAGE_WINDOW = timedelta(days=7)  # window length used when neither usage bound is supplied
+MAX_USAGE_WINDOW = timedelta(days=90)  # largest accepted span between the two usage bounds
+
+
+def _normalize_datetime(value: datetime) -> datetime:  # Return value as a timezone-aware datetime in UTC.
+    if value.tzinfo is None:
+        return value.replace(tzinfo=UTC)  # naive input is labelled as UTC without shifting its clock time
+    return value.astimezone(UTC)  # aware input is converted to UTC
+
+
+class AdminUserUsageStats(CamelModel):  # Per-user usage totals; both counters are validated as >= 0.
+    traffic_bytes: int = Field(ge=0)
+    agent_tokens: int = Field(ge=0)
+
 
 class AdminUserItem(CamelModel):
     user_id: str
@@ -22,6 +38,7 @@ class AdminUserItem(CamelModel):
     last_login_at: datetime | None = None
     last_active_at: datetime | None = None
     created_at: datetime
+    usage_stats: AdminUserUsageStats
 
 
 class ListAdminUsersQuery(PageQuery):
@@ -30,6 +47,23 @@ class ListAdminUsersQuery(PageQuery):
     role: Literal["USER", "ADMIN"] | None = None
     sort: Literal["username", "createdAt", "storageUsed"] = "createdAt"
     order: Literal["asc", "desc"] = "desc"
+    usage_from: datetime | None = None
+    usage_to: datetime | None = None
+
+    def resolve_usage_window(self, *, now: datetime | None = None) -> tuple[datetime, datetime]:  # UTC (from, to) window; ValueError if invalid
+        resolved_now = _normalize_datetime(now or datetime.now(UTC))  # "now" may be injected; defaults to the current UTC time
+        if self.usage_from is None and self.usage_to is None:  # no bounds supplied: default window ending at "now"
+            return resolved_now - DEFAULT_USAGE_WINDOW, resolved_now
+        if self.usage_from is None or self.usage_to is None:  # only one of the two bounds supplied
+            raise ValueError("usageFrom and usageTo must be provided together")
+
+        usage_from = _normalize_datetime(self.usage_from)
+        usage_to = _normalize_datetime(self.usage_to)
+        if usage_from > usage_to:  # equal bounds are accepted
+            raise ValueError("usageFrom must be earlier than or equal to usageTo")
+        if usage_to - usage_from > MAX_USAGE_WINDOW:  # a span of exactly MAX_USAGE_WINDOW is accepted
+            raise ValueError("usage window must not exceed 90 days")
+        return usage_from, usage_to
 
 
 class UpdateUserStatusRequest(CamelModel):
@@ -44,6 +78,7 @@ class UpdateUserStatusResponse(CamelModel):
 
 __all__ = [
     "AdminUserItem",
+    "AdminUserUsageStats",
     "ListAdminUsersQuery",
     "UpdateUserStatusRequest",
     "UpdateUserStatusResponse",
diff --git a/app/src/fileflash/schemas/agent.py b/app/src/fileflash/schemas/agent.py
index e253be0..97a25dd 100644
--- a/app/src/fileflash/schemas/agent.py
+++ b/app/src/fileflash/schemas/agent.py
@@ -20,6 +20,23 @@
     "failed",
     "canceled",
 ]
+AgentJobEventType = Literal[  # closed set of event type names; used as the type of AgentJobEvent.type
+    "job.queued",
+    "job.running",
+    "plan.ready",
+    "tool.started",
+    "tool.succeeded",
+    "tool.failed",
+    "tool.partial",
+    "agent.thinking",
+    "agent.progress",
+    "agent.ask",
+    "agent.paused",
+    "agent.resumed",
+    "job.succeeded",
+    "job.failed",
+    "job.canceled",
+]
 
 
 class AgentDataPolicy(CamelModel):
@@ -77,6 +94,13 @@ class AgentChosenSkill(CamelModel):
     name: str
 
 
+class AgentPlanningEvidence(CamelModel):  # One evidence entry; AgentPlanResult.planning_evidence holds a list of these.
+    step: int = Field(ge=1)  # must be >= 1
+    tool: str = Field(min_length=1, max_length=120)  # 1 to 120 characters
+    input: dict[str, Any] = Field(default_factory=dict)  # defaults to an empty dict
+    output_preview: dict[str, Any] = Field(default_factory=dict)  # defaults to an empty dict
+
+
 class AgentPlanResult(CamelModel):
     plan_job_id: str
     plan_hash: str
@@ -85,6 +109,7 @@ class AgentPlanResult(CamelModel):
     summary: str
     requires_confirmation: bool
     cost_estimate: AgentCostEstimate
+    planning_evidence: list[AgentPlanningEvidence] | None = None
 
 
 class AgentApproval(CamelModel):
@@ -123,6 +148,42 @@ class AgentExecutionResult(CamelModel):
     finished_at: datetime
 
 
+class AgentJobEvent(CamelModel):  # A single event describing a job, plan, tool or agent state change.
+    id: str
+    job_id: str
+    task_type: str
+    type: AgentJobEventType  # restricted to the AgentJobEventType literals
+    status: str
+    agent_phase: str | None = None  # optional; defaults to None
+    message: str
+    data: dict[str, Any] = Field(default_factory=dict)  # defaults to an empty dict
+    timestamp: datetime
+
+
+AgentInboxMessageKind = Literal[  # closed set of kinds accepted by the inbox message request/response models
+    "reply",
+    "control.pause",
+    "control.resume",
+    "control.approve",
+    "control.deny",
+    "control.skip",
+    "control.cancel",
+]
+
+
+class AgentInboxMessageRequest(CamelModel):  # Inbox message input (presumably an API request body; confirm against the router).
+    kind: AgentInboxMessageKind  # required; one of the AgentInboxMessageKind literals
+    reply_to: str | None = None  # optional; defaults to None
+    value: Any = None  # any value accepted; defaults to None
+    metadata: dict[str, Any] = Field(default_factory=dict)  # defaults to an empty dict
+
+
+class AgentInboxMessageResponse(CamelModel):  # Result model for an inbox message; all three fields are required.
+    inbox_message_id: str
+    kind: AgentInboxMessageKind  # one of the AgentInboxMessageKind literals
+    accepted_at: datetime
+
+
 __all__ = [
     "AgentActionSideEffect",
     "AgentApproval",
@@ -132,8 +193,14 @@ class AgentExecutionResult(CamelModel):
     "AgentExecutionPolicy",
     "AgentExecutionResult",
     "AgentHints",
+    "AgentInboxMessageKind",
+    "AgentInboxMessageRequest",
+    "AgentInboxMessageResponse",
     "AgentJobPhase",
+    "AgentJobEvent",
+    "AgentJobEventType",
     "AgentPlanContext",
+    "AgentPlanningEvidence",
     "AgentPlanResult",
     "AgentProposedAction",
     "AgentReasoningEffort",
diff --git a/app/src/fileflash/services/__init__.py b/app/src/fileflash/services/__init__.py
index e523bba..551c022 100644
--- a/app/src/fileflash/services/__init__.py
+++ b/app/src/fileflash/services/__init__.py
@@ -2,6 +2,7 @@
 from .agent import ExecuteService, McpService, MemoryService, PlanService, SessionService, SettingsService, SkillService
 from .auth import AuthService
 from .background_jobs import BackgroundJobService
+from .download_rate_limit import DownloadRateLimitService
 from .email_delivery import VerificationEmailDeliveryService
 from .file import FileService
 from .folder import FolderService
@@ -17,6 +18,7 @@
     "AuthService",
     "ArchiveService",
     "BackgroundJobService",
+    "DownloadRateLimitService",
     "VerificationEmailDeliveryService",
     "ExecuteService",
     "FileService",
diff --git a/app/src/fileflash/services/admin/users.py b/app/src/fileflash/services/admin/users.py
index e53a881..7c86a9a 100644
--- a/app/src/fileflash/services/admin/users.py
+++ b/app/src/fileflash/services/admin/users.py
@@ -6,9 +6,16 @@
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from ...core.errors import ApiError
-from ...models.enums import UserRole, UserStatus
+from ...models.enums import UploadTaskStatus, UserRole, UserStatus
 from ...models.tables_identity import User, UserSession
-from ...schemas.admin.users import AdminUserItem, ListAdminUsersQuery, UpdateUserStatusResponse
+from ...models.tables_storage import UploadTask
+from ...models.tables_worker import BackgroundJob
+from ...schemas.admin.users import (
+    AdminUserItem,
+    AdminUserUsageStats,
+    ListAdminUsersQuery,
+    UpdateUserStatusResponse,
+)
 from ...schemas.common import PaginatedData, PaginationMeta
 from ._status import external_to_internal, internal_to_external
 
@@ -42,8 +49,25 @@ async def list_users(self, *, query: ListAdminUsersQuery) -> PaginatedData[Admin
         offset = (query.page - 1) * query.per_page
         rows = list(await self.db.scalars(statement.offset(offset).limit(query.per_page)))
 
-        last_seen_map = await self._collect_last_seen([int(row.user_id) for row in rows])
-        items = [self._to_item(row, last_seen_map.get(int(row.user_id))) for row in rows]
+        user_ids = [int(row.user_id) for row in rows]
+        last_seen_map = await self._collect_last_seen(user_ids)
+        usage_from, usage_to = self._resolve_usage_window(query)
+        usage_map = await self._collect_usage_stats(
+            user_ids=user_ids,
+            usage_from=usage_from,
+            usage_to=usage_to,
+        )
+        items = [
+            self._to_item(
+                row,
+                last_seen_map.get(int(row.user_id)),
+                usage_map.get(
+                    int(row.user_id),
+                    AdminUserUsageStats(traffic_bytes=0, agent_tokens=0),
+                ),
+            )
+            for row in rows
+        ]
         return PaginatedData(
             items=items,
             pagination=PaginationMeta(
@@ -56,6 +80,71 @@ async def list_users(self, *, query: ListAdminUsersQuery) -> PaginatedData[Admin
             ),
         )
 
+    @staticmethod
+    def _resolve_usage_window(query: ListAdminUsersQuery) -> tuple[datetime, datetime]:  # Resolve the query's usage window.
+        try:
+            return query.resolve_usage_window()
+        except ValueError as exc:  # validation failures become a 400 ApiError carrying the same message
+            raise ApiError(status_code=400, code=400, message=str(exc)) from exc
+
+    async def _collect_usage_stats(  # Aggregate per-user traffic bytes and agent tokens inside the usage window.
+        self,
+        *,
+        user_ids: list[int],
+        usage_from: datetime,
+        usage_to: datetime,
+    ) -> dict[int, AdminUserUsageStats]:
+        if not user_ids:  # nothing to query; users without rows are simply absent from the returned dict
+            return {}
+
+        traffic_rows = await self.db.execute(  # traffic = summed total_size of matching upload tasks, per user
+            select(UploadTask.user_id, func.coalesce(func.sum(UploadTask.total_size), 0))
+            .where(
+                and_(
+                    UploadTask.user_id.in_(user_ids),
+                    UploadTask.status == UploadTaskStatus.COMPLETED,  # only completed uploads are counted
+                    UploadTask.completed_at.is_not(None),
+                    UploadTask.completed_at >= usage_from,  # both window bounds are inclusive
+                    UploadTask.completed_at <= usage_to,
+                )
+            )
+            .group_by(UploadTask.user_id)
+        )
+        stats: dict[int, AdminUserUsageStats] = {
+            int(user_id): AdminUserUsageStats(traffic_bytes=int(total or 0), agent_tokens=0)  # tokens are filled in below
+            for user_id, total in traffic_rows.all()
+        }
+
+        token_expr = BackgroundJob.result["costEstimate"]["tokens"].as_integer()  # result.costEstimate.tokens as an integer
+        agent_rows = await self.db.execute(
+            select(
+                BackgroundJob.requested_by,
+                func.coalesce(func.sum(func.coalesce(token_expr, 0)), 0),  # jobs with no token value contribute 0
+            )
+            .where(
+                and_(
+                    BackgroundJob.requested_by.in_(user_ids),
+                    BackgroundJob.task_type == "agent.plan",  # only succeeded "agent.plan" jobs are counted
+                    BackgroundJob.status == "succeeded",
+                    BackgroundJob.finished_at.is_not(None),
+                    BackgroundJob.finished_at >= usage_from,  # both window bounds are inclusive
+                    BackgroundJob.finished_at <= usage_to,
+                )
+            )
+            .group_by(BackgroundJob.requested_by)
+        )
+        for user_id, total in agent_rows.all():
+            if user_id is None:  # skip rows without a requesting user
+                continue
+            key = int(user_id)
+            current = stats.get(key, AdminUserUsageStats(traffic_bytes=0, agent_tokens=0))
+            stats[key] = AdminUserUsageStats(
+                traffic_bytes=current.traffic_bytes,  # keep the traffic total computed by the first query
+                agent_tokens=int(total or 0),
+            )
+
+        return stats
+
     async def set_status(self, *, user_id: int, external_status: str) -> UpdateUserStatusResponse:
         target = await self.db.get(User, user_id)
         if target is None or target.deleted_at is not None:
@@ -113,7 +202,11 @@ async def _collect_last_seen(self, user_ids: list[int]) -> dict[int, datetime]:
         return {int(user_id): seen for user_id, seen in rows.all()}
 
     @staticmethod
-    def _to_item(row: User, last_active_at: datetime | None) -> AdminUserItem:
+    def _to_item(
+        row: User,
+        last_active_at: datetime | None,
+        usage_stats: AdminUserUsageStats,
+    ) -> AdminUserItem:
         limit = max(int(row.storage_limit), 1)
         return AdminUserItem(
             user_id=str(row.user_id),
@@ -129,6 +222,7 @@ def _to_item(row: User, last_active_at: datetime | None) -> AdminUserItem:
             last_login_at=row.last_login_at,
             last_active_at=last_active_at,
             created_at=row.created_at,
+            usage_stats=usage_stats,
         )
 
 
diff --git a/app/src/fileflash/services/agent/skill_service.py b/app/src/fileflash/services/agent/skill_service.py
index cc06582..634c2d9 100644
--- a/app/src/fileflash/services/agent/skill_service.py
+++ b/app/src/fileflash/services/agent/skill_service.py
@@ -23,6 +23,7 @@
     UpdateAgentSkillRequest,
 )
 from ...schemas.common import PaginatedData, PaginationMeta
+from ...agents.harness.tool_registry import REGISTRY
 
 
 class SkillService:
@@ -66,6 +67,19 @@ def _coerce_tool_whitelist(raw: Any) -> list[str]:
             return [str(item) for item in raw if isinstance(item, (str, int, float))]
         return []
 
+    @staticmethod
+    def _validate_tool_whitelist(raw: list[str]) -> list[str]:  # Clean the whitelist and reject names unknown to REGISTRY.
+        tools = [str(item).strip() for item in raw if str(item).strip()]  # trim entries and drop blank ones
+        unknown = REGISTRY.unknown_names(tools)
+        if unknown:
+            raise ApiError(  # reject the whole list and report the offending names in sorted order
+                status_code=422,
+                code=422,
+                message="Unknown agent tool in toolWhitelist",
+                data={"unknownTools": sorted(unknown)},
+            )
+        return tools  # the cleaned names, in their original order
+
     @classmethod
     def _to_item(cls, entity: AgentSkill) -> AgentSkillItem:
         visibility_value = (
@@ -140,13 +154,14 @@ async def get_skill(self, *, user_id: int, skill_key: str) -> AgentSkillItem:
 
     async def create_custom_skill(self, *, user_id: int, payload: CreateAgentSkillRequest) -> AgentSkillItem:
         skill_key = await self._generate_unique_user_skill_key(user_id=user_id, name=payload.name)
+        tool_whitelist = self._validate_tool_whitelist(payload.tool_whitelist)
         entity = await self.skills.create(
             values={
                 "skill_key": skill_key,
                 "name": payload.name,
                 "description": payload.description,
                 "triggers_text": payload.triggers_text,
-                "tool_whitelist_json": payload.tool_whitelist,
+                "tool_whitelist_json": tool_whitelist,
                 "plan_template_json": payload.plan_template,
                 "inputs_schema_json": payload.inputs_schema,
                 "outputs_schema_json": payload.outputs_schema,
@@ -178,7 +193,9 @@ async def update_custom_skill(self, *, user_id: int, skill_key: str, payload: Up
         if "triggers_text" in fields_set:
             values["triggers_text"] = payload.triggers_text
         if "tool_whitelist" in fields_set:
-            values["tool_whitelist_json"] = payload.tool_whitelist or []
+            values["tool_whitelist_json"] = self._validate_tool_whitelist(
+                payload.tool_whitelist or []
+            )
         if "plan_template" in fields_set:
             values["plan_template_json"] = payload.plan_template or {}
         if "inputs_schema" in fields_set:
@@ -232,12 +249,13 @@ async def import_global_skills(self, *, payload: ImportAgentSkillsRequest) -> Im
 
         results: list[ImportAgentSkillResult] = []
         for item in payload.items:
+            tool_whitelist = self._validate_tool_whitelist(item.tool_whitelist)
             existing = existing_by_key.get(item.skill_key)
             values = {
                 "name": item.name,
                 "description": item.description,
                 "triggers_text": item.triggers_text,
-                "tool_whitelist_json": item.tool_whitelist,
+                "tool_whitelist_json": tool_whitelist,
                 "plan_template_json": item.plan_template,
                 "inputs_schema_json": item.inputs_schema,
                 "outputs_schema_json": item.outputs_schema,
diff --git a/app/src/fileflash/services/download_rate_limit.py b/app/src/fileflash/services/download_rate_limit.py
new file mode 100644
index 0000000..7f1870b
--- /dev/null
+++ b/app/src/fileflash/services/download_rate_limit.py
@@ -0,0 +1,62 @@
+from __future__ import annotations
+
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ..core.errors import ApiError
+from ..core.settings import Settings
+from ..models.enums import UserRole
+from ..models.tables_identity import User
+from .rate_limiter import RedisRateLimiter
+
+
+class DownloadRateLimitService:  # Applies per-scope request-count and byte-volume download limits via RedisRateLimiter.
+    def __init__(
+        self,
+        *,
+        db: AsyncSession,
+        settings: Settings,
+        rate_limiter: RedisRateLimiter,
+    ) -> None:
+        self.db = db  # Used by enforce_user_id to load the User row.
+        self.settings = settings  # Source of the download_rate_* window and limit values.
+        self.rate_limiter = rate_limiter
+
+    async def enforce_user(self, *, user: User, bytes_count: int) -> None:
+        if user.role == UserRole.ADMIN:
+            return  # Admins are exempt from download limits.
+        await self._enforce(scope=f"user:{int(user.user_id)}", bytes_count=bytes_count)
+
+    async def enforce_user_id(self, *, user_id: int, bytes_count: int) -> None:
+        user = await self.db.get(User, user_id)  # Loaded only to check the role.
+        if user is not None and user.role == UserRole.ADMIN:
+            return
+        await self._enforce(scope=f"user:{int(user_id)}", bytes_count=bytes_count)  # A missing user is still limited under its id.
+
+    async def enforce_share_ip(self, *, client_ip: str, bytes_count: int) -> None:
+        await self._enforce(scope=f"share-ip:{client_ip}", bytes_count=bytes_count)  # Keyed by client IP; no admin exemption here.
+
+    async def _enforce(self, *, scope: str, bytes_count: int) -> None:
+        window_seconds = max(1, int(self.settings.download_rate_window_seconds))  # Configured values are clamped to >= 1.
+        request_limit = max(1, int(self.settings.download_rate_limit_requests))
+        byte_limit = max(1, int(self.settings.download_rate_limit_bytes))
+        normalized_bytes = max(0, int(bytes_count))  # Negative byte counts are treated as 0.
+
+        request_allowed = await self.rate_limiter.allow(  # Counts this call as one request in the window.
+            key=f"download-rate:{scope}:requests",
+            limit=request_limit,
+            window_seconds=window_seconds,
+        )
+        if not request_allowed:
+            raise ApiError(status_code=429, code=429, message="Download rate limit exceeded")
+
+        bytes_allowed = await self.rate_limiter.allow_weighted(  # Reached only when the request check passed.
+            key=f"download-rate:{scope}:bytes",
+            limit=byte_limit,
+            window_seconds=window_seconds,
+            weight=normalized_bytes,
+        )
+        if not bytes_allowed:  # NOTE(review): allow_weighted increments before comparing, so rejected bytes still count.
+            raise ApiError(status_code=429, code=429, message="Download bandwidth limit exceeded")
+
+
+__all__ = ["DownloadRateLimitService"]
diff --git a/app/src/fileflash/services/file.py b/app/src/fileflash/services/file.py
index 453abdb..7d18814 100644
--- a/app/src/fileflash/services/file.py
+++ b/app/src/fileflash/services/file.py
@@ -74,6 +74,12 @@ class DownloadStreamResult:
     headers: dict[str, str]
 
 
+@dataclass(slots=True)
+class BatchDownloadPlan:  # Resolved file list and size estimate for one batch ZIP download.
+    files: list[tuple[File, StorageObject, str]]  # (file row, storage object, ZIP entry path from _safe_zip_path)
+    estimated_bytes: int  # Sum of object_size (else file_size, else 0) over files; never negative.
+
+
 @dataclass(slots=True)
 class ResolvedStreamObject:
     storage_object: StorageObject
@@ -358,6 +364,15 @@ async def create_batch_download_archive(
         user_id: int,
         payload: BatchDownloadRequest,
     ) -> tuple[str, str]:
+        plan = await self.create_batch_download_plan(user_id=user_id, payload=payload)
+        return await self.create_batch_download_archive_from_plan(plan=plan)
+
+    async def create_batch_download_plan(
+        self,
+        *,
+        user_id: int,
+        payload: BatchDownloadRequest,
+    ) -> BatchDownloadPlan:
         if self.storage is None:
             raise ApiError(status_code=503, code=503, message="Object storage is unavailable")
 
@@ -427,6 +442,31 @@ async def create_batch_download_archive(
         if not files_with_storage:
             raise ApiError(status_code=404, code=404, message="No downloadable files found")
 
+        files = [
+            (
+                file_row,
+                storage_object,
+                self._safe_zip_path(file_paths.get(int(file_row.file_id), file_row.file_name)),
+            )
+            for file_row, storage_object in files_with_storage
+        ]
+        estimated_bytes = sum(
+            int(storage_object.object_size or file_row.file_size or 0)
+            for file_row, storage_object, _zip_path in files
+        )
+        return BatchDownloadPlan(files=files, estimated_bytes=max(0, estimated_bytes))
+
+    async def create_batch_download_archive_from_plan(
+        self,
+        *,
+        plan: BatchDownloadPlan,
+    ) -> tuple[str, str]:
+        if self.storage is None:
+            raise ApiError(status_code=503, code=503, message="Object storage is unavailable")
+
+        if not plan.files:
+            raise ApiError(status_code=404, code=404, message="No downloadable files found")
+
         archive_name = f"fileflash-download-{datetime.now(UTC).strftime('%Y%m%d-%H%M%S')}.zip"
         tmp = tempfile.NamedTemporaryFile(prefix="fileflash-download-", suffix=".zip", delete=False)
         tmp_path = tmp.name
@@ -434,8 +474,7 @@ async def create_batch_download_archive(
 
         try:
             with zipfile.ZipFile(tmp_path, mode="w", compression=zipfile.ZIP_DEFLATED, allowZip64=True) as archive:
-                for file_row, storage_object in files_with_storage:
-                    zip_path = self._safe_zip_path(file_paths.get(int(file_row.file_id), file_row.file_name))
+                for _file_row, storage_object, zip_path in plan.files:
                     with archive.open(zip_path, mode="w") as entry:
                         async for chunk in self.storage.iter_object(
                             bucket_name=storage_object.bucket_name,
diff --git a/app/src/fileflash/services/rate_limiter.py b/app/src/fileflash/services/rate_limiter.py
index 9ced38d..00450a9 100644
--- a/app/src/fileflash/services/rate_limiter.py
+++ b/app/src/fileflash/services/rate_limiter.py
@@ -21,13 +21,17 @@ async def _client(self) -> Redis | None:
         return self._redis
 
     async def allow(self, key: str, limit: int, window_seconds: int) -> bool:
+        return await self.allow_weighted(key=key, limit=limit, window_seconds=window_seconds, weight=1)
+
+    async def allow_weighted(self, key: str, limit: int, window_seconds: int, weight: int) -> bool:
         client = await self._client()
         if client is None:
             return True
 
+        normalized_weight = max(0, int(weight))
         try:
-            current = await client.incr(key)
-            if current == 1:
+            current = await client.incrby(key, normalized_weight)
+            if current == normalized_weight:
                 await client.expire(key, window_seconds)
             return current <= limit
         except RedisError:
diff --git a/app/src/fileflash/services/share.py b/app/src/fileflash/services/share.py
index 4d0ce35..a2b0755 100644
--- a/app/src/fileflash/services/share.py
+++ b/app/src/fileflash/services/share.py
@@ -2,7 +2,7 @@
 
 import logging
 import secrets
-from collections.abc import AsyncIterator
+from collections.abc import AsyncIterator, Awaitable, Callable
 from datetime import UTC, datetime
 from math import ceil
 from pathlib import Path
@@ -422,6 +422,7 @@ async def get_shared_file_download_stream_response(
         range_header: str | None,
         ip_address: str,
         user_agent: str | None,
+        rate_limit_check: Callable[[int], Awaitable[None]] | None = None,
     ) -> tuple[AsyncIterator[bytes], str, str, int, dict[str, str]]:
         async def _operation() -> tuple[AsyncIterator[bytes], str, str, int, dict[str, str]]:
             await apply_local_lock_timeout(self.db)
@@ -449,6 +450,11 @@ async def _operation() -> tuple[AsyncIterator[bytes], str, str, int, dict[str, s
             if object_size <= 0:
                 raise ApiError(status_code=404, code=404, message="Shared file content not found")
 
+            byte_range = self._parse_range_header(range_header=range_header, file_size=object_size)
+            bytes_to_send = object_size if byte_range is None else byte_range[1] - byte_range[0] + 1
+            if rate_limit_check is not None:
+                await rate_limit_check(bytes_to_send)
+
             if action == "download":
                 await self.db.execute(
                     update(Share)
@@ -479,7 +485,6 @@ async def _operation() -> tuple[AsyncIterator[bytes], str, str, int, dict[str, s
                 ),
             }
 
-            byte_range = self._parse_range_header(range_header=range_header, file_size=object_size)
             if byte_range is None:
                 headers["Content-Length"] = str(object_size)
                 return (
diff --git a/app/tests/test_admin_system_service.py b/app/tests/test_admin_system_service.py
index f5cbe7c..2c94b41 100644
--- a/app/tests/test_admin_system_service.py
+++ b/app/tests/test_admin_system_service.py
@@ -35,3 +35,19 @@ async def test_health_hash_computation_enabled_follows_settings() -> None:
     )
     enabled_health = await enabled_service.health()
     assert enabled_health.hash_computation_enabled is True
+
+
+@pytest.mark.asyncio
+async def test_rate_limit_status_uses_auth_default_limits() -> None:  # Checks the auth rules reported under make_settings().
+    service = AdminSystemService(
+        db=DummySession(),
+        settings=make_settings(),
+    )
+
+    status = await service.rate_limit_status()
+    rules_by_scope = {rule.scope: rule for rule in status.rules}  # Index rules by scope for direct lookup.
+
+    assert rules_by_scope["auth.login"].limit == 30  # Same value as LOGIN_RATE_LIMIT in .env.example.
+    assert rules_by_scope["auth.login"].window_seconds == 300
+    assert rules_by_scope["auth.register"].limit == 12  # Same value as REGISTER_RATE_LIMIT in .env.example.
+    assert rules_by_scope["auth.register"].window_seconds == 600
diff --git a/app/tests/test_admin_users_routes.py b/app/tests/test_admin_users_routes.py
index b5cccae..bff1702 100644
--- a/app/tests/test_admin_users_routes.py
+++ b/app/tests/test_admin_users_routes.py
@@ -9,7 +9,7 @@
 from fileflash.core.deps import get_admin_users_service, require_admin
 from fileflash.core.errors import ApiError, api_error_handler
 from fileflash.routers.admin_users import router as admin_users_router
-from fileflash.schemas.admin.users import AdminUserItem, UpdateUserStatusResponse
+from fileflash.schemas.admin.users import AdminUserItem, AdminUserUsageStats, UpdateUserStatusResponse
 from fileflash.schemas.common import PaginatedData, PaginationMeta
 
 
@@ -29,6 +29,7 @@ async def list_users(self, *, query):  # noqa: ANN001
             last_login_at=None,
             last_active_at=None,
             created_at=datetime.now(UTC),
+            usage_stats=AdminUserUsageStats(traffic_bytes=1024, agent_tokens=42),
         )
         return PaginatedData(
             items=[item],
@@ -73,6 +74,7 @@ def test_admin_can_list_users() -> None:
     body = resp.json()
     assert body["success"] is True
     assert body["data"]["items"][0]["username"] == "alice"
+    assert body["data"]["items"][0]["usageStats"] == {"trafficBytes": 1024, "agentTokens": 42}
 
 
 def test_non_admin_gets_403() -> None:
@@ -81,6 +83,32 @@ def test_non_admin_gets_403() -> None:
     assert resp.status_code == 403
 
 
+def test_usage_window_requires_both_bounds() -> None:  # usageFrom without usageTo must be rejected.
+    with _client(admin=True) as c:
+        resp = c.get("/api/v1/admin/users?usageFrom=2026-01-01T00:00:00Z")  # Only the lower bound is supplied.
+    assert resp.status_code == 400
+
+
+def test_usage_window_rejects_reversed_bounds() -> None:  # usageFrom later than usageTo must be rejected.
+    with _client(admin=True) as c:
+        resp = c.get(
+            "/api/v1/admin/users"
+            "?usageFrom=2026-02-01T00:00:00Z"  # Lower bound is one month after the upper bound.
+            "&usageTo=2026-01-01T00:00:00Z"
+        )
+    assert resp.status_code == 400
+
+
+def test_usage_window_rejects_more_than_90_days() -> None:  # A window longer than 90 days must be rejected.
+    with _client(admin=True) as c:
+        resp = c.get(
+            "/api/v1/admin/users"
+            "?usageFrom=2026-01-01T00:00:00Z"
+            "&usageTo=2026-04-02T00:00:00Z"  # 91 days after usageFrom (2026 is not a leap year).
+        )
+    assert resp.status_code == 400
+
+
 def test_admin_can_patch_status() -> None:
     with _client(admin=True) as c:
         resp = c.patch("/api/v1/admin/users/42/status", json={"status": "suspended"})
diff --git a/app/tests/test_admin_users_service.py b/app/tests/test_admin_users_service.py
index 9e455a8..1370023 100644
--- a/app/tests/test_admin_users_service.py
+++ b/app/tests/test_admin_users_service.py
@@ -42,6 +42,14 @@ def __init__(self) -> None:
         self.execute = AsyncMock()
 
 
+class ResultRows:  # Minimal stand-in for a query result: all() returns the rows given at construction.
+    def __init__(self, rows) -> None:  # noqa: ANN001
+        self._rows = rows  # Stored as-is; no copying or validation.
+
+    def all(self):  # noqa: ANN201
+        return self._rows
+
+
 @pytest.mark.asyncio
 async def test_list_users_returns_paginated_items() -> None:
     session = DummySession()
@@ -55,6 +63,41 @@ async def test_list_users_returns_paginated_items() -> None:
     assert result.pagination.total_items == 1
     assert result.items[0].username == "alice"
     assert result.items[0].status == "active"
+    assert result.items[0].usage_stats.traffic_bytes == 0
+    assert result.items[0].usage_stats.agent_tokens == 0
+
+
+def test_list_users_query_default_usage_window() -> None:  # With no bounds given, the window should end at `now`.
+    now = datetime(2026, 5, 26, 12, 0, tzinfo=UTC)  # Fixed clock so the result is deterministic.
+    usage_from, usage_to = ListAdminUsersQuery().resolve_usage_window(now=now)
+
+    assert usage_to == now
+    assert (usage_to - usage_from).days == 7  # NOTE(review): .days truncates, so any span in [7, 8) days passes.
+
+
+@pytest.mark.asyncio
+async def test_collect_usage_stats_aggregates_traffic_and_tokens() -> None:  # Merges two per-user result sets into usage stats.
+    session = DummySession()
+    session.execute = AsyncMock(
+        side_effect=[
+            ResultRows([(1, 2048), (2, 4096)]),  # First execute(): (user_id, traffic bytes), per the assertions below.
+            ResultRows([(1, 1500), (3, None)]),  # Second execute(): (user_id, agent tokens); None should read as 0.
+        ]
+    )
+    service = AdminUsersService(db=session)  # type: ignore[arg-type]
+
+    stats = await service._collect_usage_stats(
+        user_ids=[1, 2, 3],
+        usage_from=datetime(2026, 5, 1, tzinfo=UTC),
+        usage_to=datetime(2026, 5, 26, tzinfo=UTC),
+    )
+
+    assert stats[1].traffic_bytes == 2048
+    assert stats[1].agent_tokens == 1500
+    assert stats[2].traffic_bytes == 4096
+    assert stats[2].agent_tokens == 0  # User 2 has no token row.
+    assert stats[3].traffic_bytes == 0  # User 3 has no traffic row.
+    assert stats[3].agent_tokens == 0  # User 3's token value was None.
 
 
 @pytest.mark.asyncio
diff --git a/app/tests/test_agent_a_end_to_end.py b/app/tests/test_agent_a_end_to_end.py
new file mode 100644
index 0000000..377fcbc
--- /dev/null
+++ b/app/tests/test_agent_a_end_to_end.py
@@ -0,0 +1,108 @@
+from __future__ import annotations
+
+import asyncio
+from datetime import UTC, datetime
+from types import SimpleNamespace
+from unittest.mock import AsyncMock
+
+import pytest
+from test_agent_inbox_repository import InboxSession
+
+from fileflash.agents.harness.event_bus import InMemoryAgentEventBus
+from fileflash.agents.harness.inbox import AgentInbox
+from fileflash.agents.runtime import execute_runner as execute_module
+from fileflash.agents.runtime.execute_runner import AgentJobCanceled, ExecuteRunner
+from fileflash.models import BackgroundJob
+from fileflash.models.enums import AgentInboxKind
+
+
+class RuntimeInboxSession(InboxSession):  # InboxSession plus no-op refresh/rollback; presumably needed by ExecuteRunner - confirm.
+    async def refresh(self, _job: BackgroundJob) -> None:
+        return None  # The in-memory job object is never reloaded.
+
+    async def rollback(self) -> None:
+        return None  # Nothing to undo in the fake session.
+
+
+def _execute_job() -> BackgroundJob:  # Builds a running agent.execute job (id 800) requested by user 7.
+    now = datetime.now(UTC)  # One timestamp reused for every time field below.
+    return BackgroundJob(
+        job_id=800,
+        task_type="agent.execute",
+        status="running",
+        payload={
+            "planJobId": "500",
+            "planHash": "sha256:test",
+            "approval": {
+                "confirmedBy": "7",
+                "confirmedAt": now.isoformat(),
+                "highRiskConfirmed": False,
+            },
+        },
+        result={},
+        requested_by=7,
+        scheduled_at=now,
+        created_at=now,
+        updated_at=now,
+    )
+
+
+@pytest.mark.asyncio
+async def test_user_pause_then_cancel_via_inbox(monkeypatch: pytest.MonkeyPatch):  # Pause queued up front, cancel sent once paused.
+    action = {  # Single low-risk read step used as the plan's only proposed action.
+        "step": 1,
+        "tool": "drive.countFiles",
+        "input": {"folderId": "root", "recursive": True, "category": "video"},
+        "sideEffect": "read",
+        "riskLevel": "low",
+        "requiresConfirmation": False,
+    }
+    monkeypatch.setattr(  # Stub plan repository: returns a plan holding only the action above.
+        execute_module,
+        "AgentPlanRepository",
+        lambda _db: SimpleNamespace(
+            get_for_execute_binding=AsyncMock(
+                return_value=SimpleNamespace(proposed_actions_json=[action])
+            )
+        ),
+    )
+    monkeypatch.setattr(  # Stub work-session repository with no-op async methods.
+        execute_module,
+        "AgentWorkSessionRepository",
+        lambda _db: SimpleNamespace(
+            create_for_job=AsyncMock(return_value=None),
+            close_session=AsyncMock(return_value=None),
+        ),
+    )
+
+    session = RuntimeInboxSession()
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=session, event_bus=bus)  # type: ignore[arg-type]
+    job = _execute_job()
+    seen_events: list[str] = []  # Event types observed by the listener, in arrival order.
+
+    await inbox.handle(job_id=int(job.job_id), kind=AgentInboxKind.CONTROL_PAUSE, payload={})  # Pause is queued before the run.
+    await session.commit()
+
+    async def cancel_when_paused() -> None:
+        async with bus.subscribe(job_id=int(job.job_id)) as stream:
+            while True:
+                event = await stream.next(timeout=2.0)  # Bounded wait per event, so a missing event cannot hang the test.
+                seen_events.append(event.event_type)
+                if event.event_type == "agent.paused":
+                    await inbox.handle(  # Respond to the pause by sending a cancel control.
+                        job_id=int(job.job_id),
+                        kind=AgentInboxKind.CONTROL_CANCEL,
+                        payload={},
+                    )
+                    await session.commit()
+                    return
+
+    listener = asyncio.create_task(cancel_when_paused())
+    await asyncio.sleep(0)  # Yield once so the listener task gets a chance to run before the runner starts.
+    with pytest.raises(AgentJobCanceled):
+        await ExecuteRunner(event_bus=bus).run(db=session, job=job)  # type: ignore[arg-type]
+    await listener  # Re-raises any failure from the listener task.
+
+    assert "agent.paused" in seen_events
+    assert job.cancel_requested_at is not None
diff --git a/app/tests/test_agent_ask_protocol.py b/app/tests/test_agent_ask_protocol.py
new file mode 100644
index 0000000..d935075
--- /dev/null
+++ b/app/tests/test_agent_ask_protocol.py
@@ -0,0 +1,67 @@
+from __future__ import annotations
+
+import asyncio
+
+import pytest
+from test_agent_inbox_repository import InboxSession
+
+from fileflash.agents.harness.ask import AskProtocol, AskTimedOut
+from fileflash.agents.harness.event_bus import InMemoryAgentEventBus
+from fileflash.agents.harness.inbox import AgentInbox
+from fileflash.models.enums import AgentInboxKind, AgentInboxStatus
+
+
+@pytest.mark.asyncio
+async def test_ask_returns_when_reply_arrives() -> None:  # ask() should return the value of a reply sent while it waits.
+    session = InboxSession()
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=session, event_bus=bus)  # type: ignore[arg-type]
+    protocol = AskProtocol(db=session, event_bus=bus, job_id=1)  # type: ignore[arg-type]
+
+    await protocol.start()
+    try:
+        async def reply_later() -> None:
+            for _ in range(20):  # Poll up to 20 times, 10 ms apart, for the ASK message to appear.
+                asks = [msg for msg in session.messages if msg.kind == AgentInboxKind.ASK]
+                if asks:
+                    ask = asks[-1]  # Reply to the most recent ask.
+                    await inbox.handle(
+                        job_id=1,
+                        kind=AgentInboxKind.REPLY,
+                        payload={"value": "A"},
+                        reply_to_id=int(ask.inbox_message_id),
+                    )
+                    await session.commit()
+                    return
+                await asyncio.sleep(0.01)
+            raise AssertionError("ask message was not created")
+
+        replier = asyncio.create_task(reply_later())  # Runs concurrently with the ask() call below.
+        result = await protocol.ask(
+            prompt="choose",
+            schema={"choice": ["A", "B"]},
+            timeout_sec=2.0,
+        )
+        await replier  # Re-raises the AssertionError if no ask was ever seen.
+    finally:
+        await protocol.aclose()
+
+    assert result == "A"
+
+
+@pytest.mark.asyncio
+async def test_ask_times_out() -> None:  # With no reply sent, ask() must raise and mark the ask as timed out.
+    session = InboxSession()
+    bus = InMemoryAgentEventBus()
+    protocol = AskProtocol(db=session, event_bus=bus, job_id=1)  # type: ignore[arg-type]
+
+    await protocol.start()
+    try:
+        with pytest.raises(AskTimedOut):
+            await protocol.ask(prompt="?", schema={}, timeout_sec=0.1)  # Nothing replies within 0.1 s.
+    finally:
+        await protocol.aclose()
+
+    asks = [msg for msg in session.messages if msg.kind == AgentInboxKind.ASK]
+    assert asks  # The ask message was still recorded.
+    assert asks[-1].status == AgentInboxStatus.TIMED_OUT
diff --git a/app/tests/test_agent_event_bus.py b/app/tests/test_agent_event_bus.py
new file mode 100644
index 0000000..6214640
--- /dev/null
+++ b/app/tests/test_agent_event_bus.py
@@ -0,0 +1,82 @@
+from __future__ import annotations
+
+from datetime import UTC, datetime
+
+import pytest
+
+from fileflash.agents.harness.event_bus import AgentEventEnvelope, InMemoryAgentEventBus
+
+
+@pytest.mark.asyncio
+async def test_subscriber_receives_published_event() -> None:  # A subscriber gets the envelope published for its job.
+    bus = InMemoryAgentEventBus()
+    envelope = AgentEventEnvelope(
+        job_id=42,
+        event_type="agent.ask",
+        payload={"prompt": "choose"},
+        emitted_at=datetime.now(UTC),
+    )
+
+    async with bus.subscribe(job_id=42) as stream:
+        await bus.publish(envelope)  # Published after subscribing, inside the subscription scope.
+        received = await stream.next(timeout=1.0)
+
+    assert received == envelope
+
+
+@pytest.mark.asyncio
+async def test_only_subscribers_of_same_job_receive() -> None:  # Events for another job must not reach this subscriber.
+    bus = InMemoryAgentEventBus()
+    own = AgentEventEnvelope(
+        job_id=1,
+        event_type="job.running",
+        payload={},
+        emitted_at=datetime.now(UTC),
+    )
+    other = AgentEventEnvelope(
+        job_id=2,
+        event_type="job.running",
+        payload={},
+        emitted_at=datetime.now(UTC),
+    )
+
+    async with bus.subscribe(job_id=1) as stream:
+        await bus.publish(other)  # Published first; belongs to job 2.
+        await bus.publish(own)
+        first = await stream.next(timeout=1.0)  # The first event delivered must be the job 1 envelope.
+
+    assert first == own
+
+
+@pytest.mark.asyncio
+async def test_empty_subscriber_times_out() -> None:  # next() raises TimeoutError when nothing is published.
+    bus = InMemoryAgentEventBus()
+    async with bus.subscribe(job_id=7) as stream:
+        with pytest.raises(TimeoutError):
+            await stream.next(timeout=0.1)  # No event is ever published for job 7.
+
+
+def test_event_envelope_json_serializes_nested_datetime_payload() -> None:  # to_json/from_json round trip with nested datetimes.
+    now = datetime.now(UTC).replace(microsecond=0)  # Microseconds are zeroed before the round trip.
+    envelope = AgentEventEnvelope(
+        job_id=9,
+        event_type="job.succeeded",
+        payload={
+            "data": {
+                "result": {
+                    "finishedAt": now,  # datetime nested inside dicts.
+                    "steps": [{"completedAt": now}],  # datetime nested inside a list of dicts.
+                }
+            }
+        },
+        emitted_at=now,
+        event_id="evt-1",
+    )
+
+    decoded = AgentEventEnvelope.from_json(envelope.to_json())
+
+    assert decoded.job_id == envelope.job_id
+    assert decoded.event_type == envelope.event_type
+    assert decoded.event_id == "evt-1"
+    assert decoded.payload["data"]["result"]["finishedAt"] == now.isoformat()  # Payload datetimes decode as ISO strings.
+    assert decoded.payload["data"]["result"]["steps"][0]["completedAt"] == now.isoformat()
diff --git a/app/tests/test_agent_inbox.py b/app/tests/test_agent_inbox.py
new file mode 100644
index 0000000..7520ffa
--- /dev/null
+++ b/app/tests/test_agent_inbox.py
@@ -0,0 +1,52 @@
+from __future__ import annotations
+
+import pytest
+from test_agent_inbox_repository import InboxSession
+
+from fileflash.agents.harness.event_bus import InMemoryAgentEventBus
+from fileflash.agents.harness.inbox import AgentInbox
+from fileflash.models import AgentInboxMessage
+from fileflash.models.enums import AgentInboxKind
+from fileflash.repositories import AgentInboxMessageRepository
+
+
+@pytest.mark.asyncio
+async def test_handle_reply_persists_and_publishes() -> None:  # A reply returns a message and emits agent.inbox.reply.
+    session = InboxSession()
+    repo = AgentInboxMessageRepository(session)  # type: ignore[arg-type]
+    ask = await repo.create_ask(job_id=1, payload={"prompt": "?"})  # The ask that the reply will reference.
+    await session.commit()
+
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=session, event_bus=bus)  # type: ignore[arg-type]
+
+    async with bus.subscribe(job_id=1) as stream:
+        msg = await inbox.handle(
+            job_id=1,
+            kind=AgentInboxKind.REPLY,
+            payload={"value": "yes"},
+            reply_to_id=int(ask.inbox_message_id),
+        )
+        await session.commit()
+        event = await stream.next(timeout=1.0)
+
+    assert isinstance(msg, AgentInboxMessage)
+    assert msg.kind == AgentInboxKind.REPLY
+    assert event.event_type == "agent.inbox.reply"
+    assert event.payload["replyTo"] == str(ask.inbox_message_id)  # The ask id is carried as a string in the event.
+    assert event.payload["value"] == "yes"
+
+
+@pytest.mark.asyncio
+async def test_reply_with_unknown_ask_raises() -> None:  # Replying to a non-existent ask must raise ValueError.
+    session = InboxSession()
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=session, event_bus=bus)  # type: ignore[arg-type]
+
+    with pytest.raises(ValueError):
+        await inbox.handle(
+            job_id=1,
+            kind=AgentInboxKind.REPLY,
+            payload={"value": "yes"},
+            reply_to_id=999999,  # The fresh session holds no messages, so this id cannot match.
+        )
diff --git a/app/tests/test_agent_inbox_model.py b/app/tests/test_agent_inbox_model.py
new file mode 100644
index 0000000..b9fae17
--- /dev/null
+++ b/app/tests/test_agent_inbox_model.py
@@ -0,0 +1,22 @@
+from __future__ import annotations
+
+from datetime import UTC, datetime
+
+from fileflash.models import AgentInboxMessage
+from fileflash.models.enums import AgentInboxKind, AgentInboxRole, AgentInboxStatus
+
+
+def test_agent_inbox_message_model_fields() -> None:  # Checks the table name and that constructor fields read back.
+    msg = AgentInboxMessage(
+        job_id=1,
+        role=AgentInboxRole.AGENT,
+        kind=AgentInboxKind.ASK,
+        payload_json={"prompt": "which one?", "schema": {}},
+        status=AgentInboxStatus.WAITING,
+        created_at=datetime.now(UTC),
+    )
+
+    assert AgentInboxMessage.__tablename__ == "agent_inbox_message"
+    assert msg.kind == AgentInboxKind.ASK
+    assert msg.status == AgentInboxStatus.WAITING
+    assert msg.payload_json["prompt"] == "which one?"  # The payload dict is readable by key.
diff --git a/app/tests/test_agent_inbox_repository.py b/app/tests/test_agent_inbox_repository.py
new file mode 100644
index 0000000..7f8f62d
--- /dev/null
+++ b/app/tests/test_agent_inbox_repository.py
@@ -0,0 +1,106 @@
+from __future__ import annotations
+
+from datetime import UTC, datetime
+
+import pytest
+
+from fileflash.models import AgentInboxMessage
+from fileflash.models.enums import AgentInboxKind, AgentInboxRole, AgentInboxStatus
+from fileflash.repositories import AgentInboxMessageRepository
+
+
+class InboxSession:  # In-memory fake of the session methods used by the agent inbox tests.
+    def __init__(self) -> None:
+        self.messages: list[AgentInboxMessage] = []  # Every message passed to add(), in insertion order.
+        self._next_id = 1  # Next id handed out by add().
+        self.commits = 0  # Number of commit() calls.
+
+    def add(self, msg: AgentInboxMessage) -> None:
+        msg.inbox_message_id = self._next_id  # Assign a sequential id at add() time.
+        self._next_id += 1
+        self.messages.append(msg)
+
+    async def flush(self) -> None:
+        return None  # No-op: ids are already assigned in add().
+
+    async def commit(self) -> None:
+        self.commits += 1  # Only counted; nothing is persisted.
+
+    async def get(self, _model, inbox_message_id: int):  # noqa: ANN001
+        for msg in self.messages:  # Linear lookup by id; the model argument is ignored.
+            if msg.inbox_message_id == inbox_message_id:
+                return msg
+        return None
+
+    async def scalar(self, _query):  # noqa: ANN001
+        return None  # The query is ignored; always reports no row.
+
+    async def scalars(self, _query):  # noqa: ANN001
+        controls = {  # Kinds this fake treats as control messages.
+            AgentInboxKind.CONTROL_PAUSE,
+            AgentInboxKind.CONTROL_RESUME,
+            AgentInboxKind.CONTROL_APPROVE,
+            AgentInboxKind.CONTROL_DENY,
+            AgentInboxKind.CONTROL_SKIP,
+            AgentInboxKind.CONTROL_CANCEL,
+        }
+        return [  # The query is ignored (no job_id filtering): USER control messages with status None.
+            msg
+            for msg in self.messages
+            if msg.role == AgentInboxRole.USER
+            and msg.kind in controls
+            and msg.status is None
+        ]
+
+
+@pytest.mark.asyncio
+async def test_create_ask_then_record_reply() -> None:  # Walks ask -> user reply -> mark answered through the repository.
+    session = InboxSession()
+    repo = AgentInboxMessageRepository(session)  # type: ignore[arg-type]
+
+    ask = await repo.create_ask(
+        job_id=1,
+        payload={"prompt": "choose", "schema": {"choice": ["A", "B"]}},
+    )
+    await session.commit()
+    assert ask.status == AgentInboxStatus.WAITING  # A new ask starts out waiting.
+    assert ask.role == AgentInboxRole.AGENT
+    assert ask.kind == AgentInboxKind.ASK
+
+    reply = await repo.record_user_message(
+        job_id=1,
+        kind=AgentInboxKind.REPLY,
+        payload={"value": "A"},
+        reply_to_id=int(ask.inbox_message_id),
+    )
+    await session.commit()
+    assert reply.role == AgentInboxRole.USER
+    assert reply.reply_to_id == ask.inbox_message_id  # The reply links back to the ask.
+
+    answered = await repo.mark_answered(
+        inbox_message_id=int(ask.inbox_message_id),
+        answered_at=datetime.now(UTC),
+    )
+    await session.commit()
+    assert answered.status == AgentInboxStatus.ANSWERED
+    assert answered.answered_at is not None
+
+
+@pytest.mark.asyncio
+async def test_pending_controls_excludes_consumed() -> None:  # A dropped control must no longer be listed as pending.
+    session = InboxSession()
+    repo = AgentInboxMessageRepository(session)  # type: ignore[arg-type]
+    pause = await repo.record_user_message(
+        job_id=1,
+        kind=AgentInboxKind.CONTROL_PAUSE,
+        payload={},
+    )
+    await session.commit()
+
+    pending = await repo.list_pending_controls(job_id=1)
+    assert [msg.inbox_message_id for msg in pending] == [pause.inbox_message_id]  # Pending before it is dropped.
+
+    await repo.mark_dropped(inbox_message_id=int(pause.inbox_message_id))
+    await session.commit()
+    pending_after = await repo.list_pending_controls(job_id=1)
+    assert pending_after == []  # InboxSession.scalars only returns messages whose status is None.
diff --git a/app/tests/test_agent_inbox_schema.py b/app/tests/test_agent_inbox_schema.py
new file mode 100644
index 0000000..f6f7cd2
--- /dev/null
+++ b/app/tests/test_agent_inbox_schema.py
@@ -0,0 +1,21 @@
+from __future__ import annotations
+
+import pytest
+from pydantic import ValidationError
+
+from fileflash.schemas.agent import AgentInboxMessageRequest
+
+
+def test_reply_with_value_validates() -> None:  # A well-formed reply payload passes validation.
+    msg = AgentInboxMessageRequest.model_validate(
+        {"kind": "reply", "replyTo": "42", "value": "yes"}  # camelCase "replyTo" is read back as reply_to below.
+    )
+
+    assert msg.kind == "reply"
+    assert msg.reply_to == "42"
+    assert msg.value == "yes"
+
+
+def test_unknown_kind_rejected() -> None:  # An unrecognised kind must fail validation.
+    with pytest.raises(ValidationError):
+        AgentInboxMessageRequest.model_validate({"kind": "control.explode"})  # Expected not to be an accepted kind.
diff --git a/app/tests/test_agent_plan_execute_runtime.py b/app/tests/test_agent_plan_execute_runtime.py
index 46fd8ef..256bdeb 100644
--- a/app/tests/test_agent_plan_execute_runtime.py
+++ b/app/tests/test_agent_plan_execute_runtime.py
@@ -1,20 +1,25 @@
 from __future__ import annotations
 
+import asyncio
+from contextlib import asynccontextmanager
 from datetime import UTC, datetime
 from types import SimpleNamespace
+from typing import Any
 from unittest.mock import AsyncMock
 
 import pytest
 
+from fileflash.agents.harness.event_bus import AgentEventEnvelope
 from fileflash.agents.harness.policy import PolicyGuard, classify_tool_risk
 from fileflash.agents.harness.router import ToolCall, ToolRouter
 from fileflash.agents.runtime import execute_runner as execute_module
-from fileflash.agents.runtime.execute_runner import ExecuteRunner
 from fileflash.agents.runtime import plan_runner as plan_module
+from fileflash.agents.runtime.execute_runner import AgentJobCanceled, ExecuteRunner
 from fileflash.agents.runtime.llm import AnthropicPlannerClient
 from fileflash.agents.runtime.plan_runner import PlanRunner
 from fileflash.core.errors import ApiError
 from fileflash.models import BackgroundJob
+from fileflash.models.enums import AgentInboxKind
 from fileflash.repositories import (
     AgentPlanRepository,
     AgentSettingsRepository,
@@ -67,6 +72,7 @@ def settings(**overrides):
         "agent_user_concurrent_limit": 2,
         "agent_user_daily_limit": 50,
         "agent_llm_base_url": None,
+        "agent_llm_plan_max_tokens": 8192,
     }
     base.update(overrides)
     return SimpleNamespace(**base)
@@ -154,7 +160,7 @@ async def create(self, **kwargs):  # noqa: ANN003
     )
 
     assert fake_messages.kwargs["model"] == "claude-test"
-    assert fake_messages.kwargs["max_tokens"] == 4096
+    assert fake_messages.kwargs["max_tokens"] == 8192
     assert fake_messages.kwargs["system"] == "system"
     assert fake_messages.kwargs["messages"] == [{"role": "user", "content": "user"}]
     assert fake_messages.kwargs["thinking"] == {"type": "adaptive"}
@@ -239,6 +245,272 @@ async def create(self, **kwargs):  # noqa: ANN003
     assert result["summary"] == "fallback"
 
 
+@pytest.mark.asyncio
+async def test_anthropic_planner_client_retries_with_json_only_prompt_on_invalid_json():
+    class FakeMessages:  # scripted replies: prose, non-JSON text, then a valid JSON plan
+        def __init__(self) -> None:
+            self.calls: list[dict[str, object]] = []
+
+        async def create(self, **kwargs):  # noqa: ANN003
+            self.calls.append(dict(kwargs))
+            if len(self.calls) == 1:  # first attempt: free-form prose
+                return SimpleNamespace(
+                    content=[SimpleNamespace(type="text", text="I think we should move files.")],
+                    usage={},
+                )
+            if len(self.calls) == 2:  # second attempt: still not a JSON object
+                return SimpleNamespace(
+                    content=[SimpleNamespace(type="text", text="summary: move files")],
+                    usage={},
+                )
+            return SimpleNamespace(  # any later attempt: a valid JSON plan
+                content=[SimpleNamespace(type="text", text='{"summary":"strict","proposedActions":[]}')],
+                usage={},
+            )
+
+    fake_messages = FakeMessages()
+    client = AnthropicPlannerClient(
+        settings=settings(
+            agent_llm_api_key="test-key",
+            agent_llm_model="claude-test",
+        ),
+        client=SimpleNamespace(messages=fake_messages),  # type: ignore[arg-type]
+    )
+
+    result = await client.create_plan(
+        system_prompt="system",
+        user_prompt="user",
+        max_tokens=1024,
+        reasoning_effort="high",
+    )
+
+    assert len(fake_messages.calls) == 3
+    assert "thinking" in fake_messages.calls[0]  # thinking/output_config: first request only
+    assert "output_config" in fake_messages.calls[0]
+    assert "thinking" not in fake_messages.calls[1]
+    assert "output_config" not in fake_messages.calls[1]
+    assert "thinking" not in fake_messages.calls[2]
+    assert "output_config" not in fake_messages.calls[2]
+    assert fake_messages.calls[1]["max_tokens"] == 1024  # second attempt reuses the caller's value
+    assert fake_messages.calls[2]["max_tokens"] == 8192  # presumably agent_llm_plan_max_tokens
+    third_messages = fake_messages.calls[2]["messages"]
+    assert isinstance(third_messages, list)
+    assert "Return ONLY one valid JSON object" in third_messages[0]["content"]
+    assert result["summary"] == "strict"
+
+
+@pytest.mark.asyncio
+async def test_anthropic_planner_client_parses_json_from_wrapped_text():
+    class FakeMessages:  # always replies with a JSON object wrapped in surrounding prose
+        async def create(self, **kwargs):  # noqa: ANN003
+            return SimpleNamespace(
+                content=[
+                    SimpleNamespace(
+                        type="text",
+                        text='Here is the result:\n{"summary":"ok","proposedActions":[]}\nThanks!',
+                    )
+                ],
+                usage={},
+            )
+
+    client = AnthropicPlannerClient(
+        settings=settings(
+            agent_llm_api_key="test-key",
+            agent_llm_model="claude-test",
+        ),
+        client=SimpleNamespace(messages=FakeMessages()),  # type: ignore[arg-type]
+    )
+
+    result = await client.create_plan(
+        system_prompt="system",
+        user_prompt="user",
+        max_tokens=1000,
+    )
+
+    assert result["summary"] == "ok"  # fields come from the embedded JSON object
+    assert result["proposedActions"] == []
+
+
+@pytest.mark.asyncio
+async def test_anthropic_planner_client_raises_after_three_invalid_json_responses():
+    class FakeMessages:  # every reply is plain text that is not JSON
+        def __init__(self) -> None:
+            self.calls: list[dict[str, object]] = []
+
+        async def create(self, **kwargs):  # noqa: ANN003
+            self.calls.append(dict(kwargs))
+            return SimpleNamespace(
+                content=[SimpleNamespace(type="text", text="not valid json")],
+                usage={},
+            )
+
+    fake_messages = FakeMessages()
+    client = AnthropicPlannerClient(
+        settings=settings(
+            agent_llm_api_key="test-key",
+            agent_llm_model="claude-test",
+        ),
+        client=SimpleNamespace(messages=fake_messages),  # type: ignore[arg-type]
+    )
+
+    with pytest.raises(ApiError) as exc:
+        await client.create_plan(
+            system_prompt="system",
+            user_prompt="user",
+            max_tokens=1024,
+            reasoning_effort="high",
+        )
+
+    assert exc.value.status_code == 502
+    assert exc.value.message == "Agent LLM did not return valid JSON"
+    assert len(fake_messages.calls) == 3  # exactly three requests before the error is raised
+
+
+@pytest.mark.asyncio
+async def test_anthropic_planner_client_uses_tools_and_parses_tool_use_blocks():
+    class FakeMessages:  # replies with a text block followed by one tool_use block
+        def __init__(self) -> None:
+            self.kwargs = {}
+
+        async def create(self, **kwargs):  # noqa: ANN003
+            self.kwargs = kwargs
+            return SimpleNamespace(
+                content=[
+                    SimpleNamespace(type="text", text="Count matching videos."),
+                    SimpleNamespace(
+                        type="tool_use",
+                        id="toolu_1",
+                        name="drive_count_files",
+                        input={"folderId": "root", "category": "video"},
+                    ),
+                ],
+                usage={"input_tokens": 5, "output_tokens": 6},
+            )
+
+    fake_messages = FakeMessages()
+    client = AnthropicPlannerClient(
+        settings=settings(
+            agent_llm_api_key="test-key",
+            agent_llm_model="claude-test",
+        ),
+        client=SimpleNamespace(messages=fake_messages),  # type: ignore[arg-type]
+    )
+
+    result = await client.create_plan(
+        system_prompt="system",
+        user_prompt="user",
+        max_tokens=1024,
+        tools=[
+            {
+                "name": "drive_count_files",
+                "description": "Count files.",
+                "input_schema": {"type": "object"},
+                "internalName": "drive.countFiles",  # must not be sent; names the action below
+            }
+        ],
+    )
+
+    assert fake_messages.kwargs["tool_choice"] == {"type": "auto"}
+    assert fake_messages.kwargs["tools"] == [  # same spec without "internalName"
+        {
+            "name": "drive_count_files",
+            "description": "Count files.",
+            "input_schema": {"type": "object"},
+        }
+    ]
+    assert result["summary"] == "Count matching videos."  # taken from the text block
+    assert result["proposedActions"] == [
+        {
+            "step": 1,
+            "tool": "drive.countFiles",
+            "input": {"folderId": "root", "category": "video"},
+        }
+    ]
+    assert result["_usage"] == {"input_tokens": 5, "output_tokens": 6}
+
+
+@pytest.mark.asyncio
+async def test_anthropic_planner_client_executes_tool_loop_before_final_plan():
+    class FakeMessages:  # first reply requests a tool; later replies return the final JSON plan
+        def __init__(self) -> None:
+            self.calls: list[dict[str, Any]] = []
+
+        async def create(self, **kwargs):  # noqa: ANN003
+            self.calls.append(dict(kwargs))
+            if len(self.calls) == 1:
+                return SimpleNamespace(
+                    content=[
+                        SimpleNamespace(type="text", text="Need to inspect candidates first."),
+                        SimpleNamespace(
+                            type="tool_use",
+                            id="toolu_1",
+                            name="drive_search_files",
+                            input={"folderId": "root", "query": "银翼杀手", "category": "video"},
+                        ),
+                    ],
+                    usage={"input_tokens": 10, "output_tokens": 5},
+                )
+            return SimpleNamespace(
+                content=[
+                    SimpleNamespace(
+                        type="text",
+                        text=(
+                            '{"summary":"move matched file","proposedActions":['
+                            '{"step":1,"tool":"drive.moveFile","input":{"fileId":"11","targetFolderId":"21"}}'
+                            "]}"
+                        ),
+                    )
+                ],
+                usage={"input_tokens": 8, "output_tokens": 9},
+            )
+
+    fake_messages = FakeMessages()
+    tool_executor = AsyncMock(return_value={"items": [{"id": "11", "name": "银翼杀手2049.mp4"}], "totalItems": 1})
+    client = AnthropicPlannerClient(
+        settings=settings(
+            agent_llm_api_key="test-key",
+            agent_llm_model="claude-test",
+        ),
+        client=SimpleNamespace(messages=fake_messages),  # type: ignore[arg-type]
+    )
+
+    result = await client.create_plan(
+        system_prompt="system",
+        user_prompt="user",
+        max_tokens=1024,
+        tools=[
+            {
+                "name": "drive_search_files",
+                "description": "Search files.",
+                "input_schema": {"type": "object"},
+                "internalName": "drive.searchFiles",
+            },
+            {
+                "name": "drive_move_file",
+                "description": "Move file.",
+                "input_schema": {"type": "object"},
+                "internalName": "drive.moveFile",
+            },
+        ],
+        tool_executor=tool_executor,
+        max_tool_roundtrips=4,
+    )
+
+    tool_executor.assert_awaited_once_with(  # called with the internal name, not the wire name
+        "drive.searchFiles",
+        {"folderId": "root", "query": "银翼杀手", "category": "video"},
+    )
+    assert len(fake_messages.calls) == 2
+    second_messages = fake_messages.calls[1]["messages"]
+    assert isinstance(second_messages, list)
+    tool_result_blocks = second_messages[-1]["content"]  # last message of the follow-up request
+    assert isinstance(tool_result_blocks, list)
+    assert tool_result_blocks[0]["type"] == "tool_result"
+    assert result["summary"] == "move matched file"
+    assert result["proposedActions"][0]["tool"] == "drive.moveFile"
+    assert result["_usage"] == {"input_tokens": 18, "output_tokens": 14}  # 10+8 in, 5+9 out
+
+
 def test_anthropic_planner_client_uses_configured_base_url(monkeypatch: pytest.MonkeyPatch):
     captured: dict[str, object] = {}
 
@@ -571,7 +843,7 @@ async def test_plan_runner_rolls_back_when_commit_fails(monkeypatch: pytest.Monk
 
 
 @pytest.mark.asyncio
-async def test_plan_runner_uses_safe_read_only_fallback_when_planner_returns_invalid_output(
+async def test_plan_runner_propagates_llm_output_errors_without_fallback(
     monkeypatch: pytest.MonkeyPatch,
 ):
     monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
@@ -618,17 +890,13 @@ async def test_plan_runner_uses_safe_read_only_fallback_when_planner_returns_inv
     )
     db = DummyDb()
 
-    result = await runner.run(db=db, job=job)  # type: ignore[arg-type]
-
-    assert "fallback mode" in result.summary.lower()
-    assert len(result.proposed_actions) == 1
-    assert result.proposed_actions[0].tool == "drive.listFolder"
-    assert result.proposed_actions[0].side_effect == "read"
-    assert result.requires_confirmation is False
+    with pytest.raises(ApiError) as exc:
+        await runner.run(db=db, job=job)  # type: ignore[arg-type]
+    assert exc.value.status_code == 502
 
 
 @pytest.mark.asyncio
-async def test_plan_runner_fallback_uses_count_files_for_movie_count_question(
+async def test_plan_runner_uses_planner_returned_count_action_for_movie_question(
     monkeypatch: pytest.MonkeyPatch,
 ):
     monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
@@ -640,11 +908,16 @@ async def test_plan_runner_fallback_uses_count_files_for_movie_count_question(
     monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
 
     planner = AsyncMock(
-        side_effect=ApiError(
-            status_code=502,
-            code=502,
-            message="Agent LLM returned an empty response",
-        )
+        return_value={
+            "summary": "count videos",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.countFiles",
+                    "input": {"folderId": "root", "recursive": True, "category": "video"},
+                }
+            ],
+        }
     )
     runner = PlanRunner(
         settings=settings(),
@@ -682,171 +955,1321 @@ async def test_plan_runner_fallback_uses_count_files_for_movie_count_question(
     assert result.proposed_actions[0].side_effect == "read"
 
 
-def test_normalize_actions_rejects_symbolic_placeholder_target_folder():
-    with pytest.raises(ApiError) as exc:
-        plan_module._normalize_actions(
-            llm_payload={
-                "summary": "organize movies",
-                "proposedActions": [
-                    {
-                        "step": 1,
-                        "tool": "drive.createFolder",
-                        "input": {"parentFolderId": "root", "name": "Movies"},
-                    },
-                    {
-                        "step": 2,
-                        "tool": "drive.moveFile",
-                        "input": {"fileId": "13", "targetFolderId": "newFolderId"},
-                    },
-                ],
-            },
-            allowed_tools=("drive.createFolder", "drive.moveFile"),
-            max_steps=10,
-        )
-
-    assert exc.value.status_code == 400
-    assert "step 2" in exc.value.message
-    assert "targetFolderId" in exc.value.message
-    assert "newFolderId" in exc.value.message
-
+@pytest.mark.asyncio
+async def test_plan_runner_uses_planner_returned_count_action_for_anime_question(
+    monkeypatch: pytest.MonkeyPatch,
+):  # planner is mocked; the asserts inspect the action the runner returns
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
 
-def test_normalize_actions_accepts_previous_step_reference():
-    actions = plan_module._normalize_actions(
-        llm_payload={
-            "summary": "organize movies",
+    planner = AsyncMock(  # canned planner output: one recursive video count
+        return_value={
+            "summary": "count anime videos",
             "proposedActions": [
                 {
                     "step": 1,
-                    "tool": "drive.createFolder",
-                    "input": {"parentFolderId": "root", "name": "Movies"},
-                },
-                {
-                    "step": 2,
-                    "tool": "drive.moveFile",
-                    "input": {"fileId": "13", "targetFolderId": "$step1.folderId"},
-                },
+                    "tool": "drive.countFiles",
+                    "input": {"folderId": "root", "recursive": True, "category": "video"},
+                }
             ],
-        },
-        allowed_tools=("drive.createFolder", "drive.moveFile"),
-        max_steps=10,
+        }
     )
-
-    assert len(actions) == 2
-    assert actions[1].input["targetFolderId"] == "$step1.folderId"
-
-
-def test_normalize_actions_rejects_future_step_reference():
-    with pytest.raises(ApiError) as exc:
-        plan_module._normalize_actions(
-            llm_payload={
-                "summary": "organize movies",
-                "proposedActions": [
-                    {
-                        "step": 3,
-                        "tool": "drive.moveFile",
-                        "input": {"fileId": "13", "targetFolderId": "$step4.folderId"},
-                    },
-                    {
-                        "step": 4,
-                        "tool": "drive.createFolder",
-                        "input": {"parentFolderId": "root", "name": "Movies"},
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=planner),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "我上传了多少动漫？",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
+            },
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=336,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+
+    result = await runner.run(db=DummyDb(), job=job)  # type: ignore[arg-type]
+
+    assert len(result.proposed_actions) == 1
+    action = result.proposed_actions[0]
+    assert action.tool == "drive.countFiles"
+    assert action.input["category"] == "video"
+    assert action.input.get("search") in (None, "")  # no search filter should be present
+
+
+@pytest.mark.asyncio
+async def test_plan_runner_delegates_count_question_with_search_term_to_planner(
+    monkeypatch: pytest.MonkeyPatch,
+):  # planner is mocked to return a count action that carries a search term
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
+
+    planner = AsyncMock(
+        return_value={
+            "summary": "count matching movies",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.countFiles",
+                    "input": {
+                        "folderId": "root",
+                        "recursive": True,
+                        "category": "video",
+                        "search": "银翼杀手",
                     },
-                ],
+                }
+            ],
+        }
+    )
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=planner),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "我上传了几部银翼杀手？",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
             },
-            allowed_tools=("drive.createFolder", "drive.moveFile"),
-            max_steps=10,
-        )
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=335,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+
+    result = await runner.run(db=DummyDb(), job=job)  # type: ignore[arg-type]
+
+    planner.assert_awaited_once()  # the runner must call the planner exactly once
+    assert len(result.proposed_actions) == 1
+    action = result.proposed_actions[0]
+    assert action.tool == "drive.countFiles"
+    assert action.input["category"] == "video"
+    assert action.input["search"] == "银翼杀手"  # search term from the planner is kept
+    assert action.side_effect == "read"
+
+
+@pytest.mark.asyncio
+async def test_plan_runner_rejects_write_tool_in_exploratory_loop(
+    monkeypatch: pytest.MonkeyPatch,
+):  # a write tool invoked through the planning-time tool_executor must be refused
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
+
+    async def fake_create_plan(**kwargs):  # noqa: ANN003
+        tool_executor = kwargs["tool_executor"]  # executor the runner hands to the planner
+        await tool_executor("drive.moveFile", {"fileId": "1", "targetFolderId": "2"})
+        return {"summary": "should not reach", "proposedActions": []}
+
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=fake_create_plan),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "整理文件",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
+            },
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=340,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
 
+    with pytest.raises(ApiError) as exc:
+        await runner.run(db=DummyDb(), job=job)  # type: ignore[arg-type]
     assert exc.value.status_code == 400
-    assert "future step 4" in exc.value.message
-    assert "$step4.folderId" in exc.value.message
+    assert "read-only" in exc.value.message  # the error message must mention "read-only"
+
 
+@pytest.mark.asyncio
+async def test_plan_runner_uses_planner_returned_move_action_when_unique_matches(
+    monkeypatch: pytest.MonkeyPatch,
+):  # planner is mocked to return a single move with concrete ids
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
+    planner = AsyncMock(
+        return_value={
+            "summary": "move one matching file",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.moveFile",
+                    "input": {"fileId": "11", "targetFolderId": "21", "shareHandling": "keep"},
+                }
+            ],
+        }
+    )
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=planner),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "把银翼杀手电影放到银翼杀手文件夹下",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
+            },
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=337,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+
+    result = await runner.run(db=DummyDb(), job=job)  # type: ignore[arg-type]
+
+    assert len(result.proposed_actions) == 1
+    action = result.proposed_actions[0]
+    assert action.tool == "drive.moveFile"
+    assert action.input["fileId"] == "11"
+    assert action.input["targetFolderId"] == "21"
+    assert action.side_effect == "write"  # absent from the payload; presumably set by the runner
+
+
+@pytest.mark.asyncio
+async def test_plan_runner_uses_planner_returned_create_then_move_when_target_missing(
+    monkeypatch: pytest.MonkeyPatch,
+):  # planner is mocked to return createFolder followed by a dependent move
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
+    planner = AsyncMock(
+        return_value={
+            "summary": "create missing folder then move",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.createFolder",
+                    "input": {"parentFolderId": "root", "name": "银翼杀手"},
+                },
+                {
+                    "step": 2,
+                    "tool": "drive.moveFile",
+                    "input": {"fileId": "11", "targetFolderId": "$step1.folderId"},
+                },
+            ],
+        }
+    )
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=planner),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "把银翼杀手电影放到银翼杀手文件夹下",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
+            },
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=338,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+
+    result = await runner.run(db=DummyDb(), job=job)  # type: ignore[arg-type]
+
+    assert len(result.proposed_actions) == 2
+    assert result.proposed_actions[0].tool == "drive.createFolder"
+    assert result.proposed_actions[0].input["name"] == "银翼杀手"
+    assert result.proposed_actions[1].tool == "drive.moveFile"
+    assert result.proposed_actions[1].input["fileId"] == "11"
+    assert result.proposed_actions[1].input["targetFolderId"] == "$step1.folderId"  # reference kept as-is
+
+
+@pytest.mark.asyncio
+async def test_plan_runner_rewrites_write_summary_with_grounded_facts(
+    monkeypatch: pytest.MonkeyPatch,
+):  # the mocked planner summary names a folder ("V字仇杀队") that no action refers to
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
+    planner = AsyncMock(
+        return_value={
+            "summary": "创建银翼杀手文件夹，然后将 V字仇杀队 文件夹中的2部银翼杀手电影移入该文件夹。",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.createFolder",
+                    "input": {"parentFolderId": "root", "name": "银翼杀手"},
+                },
+                {
+                    "step": 2,
+                    "tool": "drive.moveFile",
+                    "input": {"fileId": "19", "targetFolderId": "$step1.folderId"},
+                },
+                {
+                    "step": 3,
+                    "tool": "drive.moveFile",
+                    "input": {"fileId": "20", "targetFolderId": "$step1.folderId"},
+                },
+            ],
+        }
+    )
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=planner),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "把银翼杀手两部，移到银翼杀手文件夹里",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
+            },
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=348,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+    db = DummyDb()
+
+    class _Rows:  # minimal stand-in for a query result that exposes .all()
+        def __init__(self, rows: list[tuple[Any, Any]]) -> None:
+            self._rows = rows
+
+        def all(self) -> list[tuple[Any, Any]]:
+            return list(self._rows)
+
+    db.execute = AsyncMock(return_value=_Rows([(19, "银翼杀手1982.mp4"), (20, "银翼杀手2049.mp4")]))
+
+    result = await runner.run(db=db, job=job)  # type: ignore[arg-type]
+
+    assert "V字仇杀队" not in result.summary  # the unsupported folder name must be gone
+    assert "创建“银翼杀手”文件夹" in result.summary
+    assert "2 个文件" in result.summary  # matches the two moveFile actions
+
+
+@pytest.mark.asyncio
+async def test_plan_runner_records_planning_evidence_from_read_tools(
+    monkeypatch: pytest.MonkeyPatch,
+):  # a read tool run during planning should surface in result.planning_evidence
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
+
+    class _FakeToolRouter:  # returns the same 7-item search result for any dispatched call
+        async def dispatch(self, _call):  # noqa: ANN001
+            return {
+                "items": [
+                    {"fileId": "19", "name": "银翼杀手1982.mp4", "path": "/My Files/videos/银翼杀手1982.mp4"},
+                    {"fileId": "20", "name": "银翼杀手2049.mp4", "path": "/My Files/videos/银翼杀手2049.mp4"},
+                    {"fileId": "21", "name": "Blade Runner Trailer.mp4", "path": "/My Files/videos/Blade Runner Trailer.mp4"},
+                    {"fileId": "22", "name": "x1.mp4", "path": "/My Files/videos/x1.mp4"},
+                    {"fileId": "23", "name": "x2.mp4", "path": "/My Files/videos/x2.mp4"},
+                    {"fileId": "24", "name": "x3.mp4", "path": "/My Files/videos/x3.mp4"},
+                    {"fileId": "25", "name": "x4.mp4", "path": "/My Files/videos/x4.mp4"},
+                ],
+                "totalItems": 7,
+                "query": "银翼杀手",
+                "folderId": "1",
+                "recursive": True,
+                "category": "video",
+            }
+
+    monkeypatch.setattr(plan_module, "ToolRouter", lambda **kwargs: _FakeToolRouter())
+
+    async def _planner_with_read_tool(**kwargs):  # noqa: ANN003
+        tool_executor = kwargs["tool_executor"]  # executor the runner hands to the planner
+        await tool_executor(
+            "drive.searchFiles",
+            {"folderId": "root", "query": "银翼杀手", "category": "video"},
+        )
+        return {
+            "summary": "search first",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.searchFiles",
+                    "input": {"folderId": "root", "query": "银翼杀手", "category": "video"},
+                }
+            ],
+        }
+
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=_planner_with_read_tool),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "找出银翼杀手视频文件",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
+            },
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=349,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+
+    result = await runner.run(db=DummyDb(), job=job)  # type: ignore[arg-type]
+
+    assert result.planning_evidence is not None
+    assert len(result.planning_evidence) == 1  # one executor call, one evidence entry
+    evidence = result.planning_evidence[0]
+    assert evidence.step == 1
+    assert evidence.tool == "drive.searchFiles"
+    assert evidence.input["query"] == "银翼杀手"
+    assert evidence.output_preview["totalItems"] == 7
+    assert isinstance(evidence.output_preview.get("items"), list)
+    assert "..." in str(evidence.output_preview["items"][-1])  # presumably a truncation marker
+
+
+@pytest.mark.asyncio
+async def test_plan_runner_uses_planner_returned_read_only_candidates_when_ambiguous(
+    monkeypatch: pytest.MonkeyPatch,
+):
+    monkeypatch.setattr(plan_module, "_choose_skill", AsyncMock(return_value=None))
+    monkeypatch.setattr(
+        plan_module,
+        "_collect_context_metadata",
+        AsyncMock(return_value={"scope": "currentFolder", "rootFolderId": "root", "files": [], "folders": []}),
+    )
+    monkeypatch.setattr(plan_module, "_upsert_agent_plan", AsyncMock(return_value=None))
+    planner = AsyncMock(
+        return_value={
+            "summary": "ambiguous, return candidates",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.searchFiles",
+                    "input": {"folderId": "root", "query": "银翼杀手", "category": "video"},
+                }
+            ],
+        }
+    )
+    runner = PlanRunner(
+        settings=settings(),
+        planner_client=SimpleNamespace(create_plan=planner),  # type: ignore[arg-type]
+    )
+    request = PlanAgentRequest.model_validate(
+        {
+            "input": "把银翼杀手电影放到银翼杀手文件夹下",
+            "context": {
+                "rootFolderId": "root",
+                "selectedFileIds": [],
+                "selectedFolderIds": [],
+                "currentPath": "/My Files",
+            },
+            "executionPolicy": "confirm",
+        }
+    )
+    job = BackgroundJob(
+        job_id=339,
+        task_type="agent.plan",
+        status="running",
+        payload=request.model_dump(by_alias=True),
+        result={},
+        requested_by=7,
+        scheduled_at=datetime.now(UTC),
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+
+    result = await runner.run(db=DummyDb(), job=job)  # type: ignore[arg-type]
+
+    assert len(result.proposed_actions) == 1
+    action = result.proposed_actions[0]
+    assert action.tool == "drive.searchFiles"
+    assert action.side_effect == "read"
+    assert "ambiguous" in result.summary
+
+
+def test_normalize_actions_rejects_symbolic_placeholder_target_folder():
+    with pytest.raises(ApiError) as exc:
+        plan_module._normalize_actions(
+            llm_payload={
+                "summary": "organize movies",
+                "proposedActions": [
+                    {
+                        "step": 1,
+                        "tool": "drive.createFolder",
+                        "input": {"parentFolderId": "root", "name": "Movies"},
+                    },
+                    {
+                        "step": 2,
+                        "tool": "drive.moveFile",
+                        "input": {"fileId": "13", "targetFolderId": "newFolderId"},
+                    },
+                ],
+            },
+            allowed_tools=("drive.createFolder", "drive.moveFile"),
+            max_steps=10,
+        )
+
+    assert exc.value.status_code == 400
+    assert "step 2" in exc.value.message
+    assert "targetFolderId" in exc.value.message
+    assert "newFolderId" in exc.value.message
+
+
+def test_normalize_actions_accepts_previous_step_reference():
+    actions = plan_module._normalize_actions(
+        llm_payload={
+            "summary": "organize movies",
+            "proposedActions": [
+                {
+                    "step": 1,
+                    "tool": "drive.createFolder",
+                    "input": {"parentFolderId": "root", "name": "Movies"},
+                },
+                {
+                    "step": 2,
+                    "tool": "drive.moveFile",
+                    "input": {"fileId": "13", "targetFolderId": "$step1.folderId"},
+                },
+            ],
+        },
+        allowed_tools=("drive.createFolder", "drive.moveFile"),
+        max_steps=10,
+    )
+
+    assert len(actions) == 2
+    assert actions[1].input["targetFolderId"] == "$step1.folderId"
+
+
+def test_normalize_actions_rejects_future_step_reference():
+    with pytest.raises(ApiError) as exc:
+        plan_module._normalize_actions(
+            llm_payload={
+                "summary": "organize movies",
+                "proposedActions": [
+                    {
+                        "step": 3,
+                        "tool": "drive.moveFile",
+                        "input": {"fileId": "13", "targetFolderId": "$step4.folderId"},
+                    },
+                    {
+                        "step": 4,
+                        "tool": "drive.createFolder",
+                        "input": {"parentFolderId": "root", "name": "Movies"},
+                    },
+                ],
+            },
+            allowed_tools=("drive.createFolder", "drive.moveFile"),
+            max_steps=10,
+        )
+
+    assert exc.value.status_code == 400
+    assert "future step 4" in exc.value.message
+    assert "$step4.folderId" in exc.value.message
+
+
+def test_execute_reference_resolution_rejects_symbolic_placeholder():
+    with pytest.raises(ApiError) as exc:
+        execute_module._resolve_references(
+            {"targetFolderId": "newFolderId"},
+            step_outputs={},
+        )
+
+    assert exc.value.status_code == 409
+    assert "targetFolderId" in exc.value.message
+    assert "$stepN.field" in exc.value.message
+
+
+@pytest.mark.asyncio
+async def test_policy_guard_blocks_delete_without_confirmation():
+    decision = await PolicyGuard().evaluate_tool_call(
+        tool_name="drive.deleteFile",
+        high_risk_confirmed=False,
+    )
+    assert decision.allowed is False
+    assert classify_tool_risk("drive.deleteFolder") == "high"
+
+
+@pytest.mark.asyncio
+async def test_tool_router_dispatches_move_file():
+    router = ToolRouter(db=DummyDb(), user_id=7)  # type: ignore[arg-type]
+    router.file_service.move_file = AsyncMock(
+        return_value=SimpleNamespace(
+            model_dump=lambda **kwargs: {"fileId": "1", "targetFolderId": "2"}
+        )
+    )
+
+    result = await router.dispatch(
+        ToolCall(
+            tool_name="drive.moveFile",
+            arguments={"fileId": "1", "targetFolderId": "2"},
+        )
+    )
+
+    assert result == {"fileId": "1", "targetFolderId": "2"}
+    router.file_service.move_file.assert_awaited_once()
+
+
+@pytest.mark.asyncio
+async def test_tool_router_count_files_counts_recursive_videos():
+    db = DummyDb()
+    db.scalar = AsyncMock(return_value=1)
+    db.scalars = AsyncMock(
+        side_effect=[
+            [1, 2],
+            [
+                SimpleNamespace(
+                    file_id=10,
+                    file_name="movie.mp4",
+                    file_size=100,
+                    mime_type="application/octet-stream",
+                    file_ext="mp4",
+                    folder_id=1,
+                    created_at=None,
+                    updated_at=None,
+                ),
+                SimpleNamespace(
+                    file_id=11,
+                    file_name="clip.mkv",
+                    file_size=200,
+                    mime_type="video/x-matroska",
+                    file_ext="mkv",
+                    folder_id=2,
+                    created_at=None,
+                    updated_at=None,
+                ),
+                SimpleNamespace(
+                    file_id=12,
+                    file_name="notes.txt",
+                    file_size=10,
+                    mime_type="text/plain",
+                    file_ext="txt",
+                    folder_id=1,
+                    created_at=None,
+                    updated_at=None,
+                ),
+            ],
+        ]
+    )
+    router = ToolRouter(db=db, user_id=7)  # type: ignore[arg-type]
+
+    result = await router.dispatch(
+        ToolCall(
+            tool_name="drive.countFiles",
+            arguments={"folderId": "root", "recursive": True, "category": "video"},
+        )
+    )
+
+    assert result["totalItems"] == 2
+    assert result["category"] == "video"
+    assert result["recursive"] is True
+    assert result["byMimeType"] == {"video/mp4": 1, "video/x-matroska": 1}
+    assert [item["name"] for item in result["sampleItems"]] == ["movie.mp4", "clip.mkv"]
+    executed_statement = str(db.scalars.await_args_list[-1].args[0])
+    assert "file.status" in executed_statement
+    assert "file.is_latest" in executed_statement
+
+
+@pytest.mark.asyncio
+async def test_tool_router_count_files_filters_by_search_term():
+    db = DummyDb()
+    db.scalar = AsyncMock(return_value=1)
+    db.scalars = AsyncMock(
+        side_effect=[
+            [1],
+            [
+                SimpleNamespace(
+                    file_id=10,
+                    file_name="银翼杀手.mp4",
+                    file_size=100,
+                    mime_type="video/mp4",
+                    file_ext="mp4",
+                    folder_id=1,
+                    created_at=None,
+                    updated_at=None,
+                ),
+            ],
+        ]
+    )
+    router = ToolRouter(db=db, user_id=7)  # type: ignore[arg-type]
+
+    result = await router.dispatch(
+        ToolCall(
+            tool_name="drive.countFiles",
+            arguments={
+                "folderId": "root",
+                "recursive": True,
+                "category": "video",
+                "search": "银翼杀手",
+            },
+        )
+    )
+
+    assert result["totalItems"] == 1
+    assert result["search"] == "银翼杀手"
+    executed_statement = str(db.scalars.await_args_list[-1].args[0])
+    assert "file_name" in executed_statement
+
+
+@pytest.mark.asyncio
+async def test_execute_runner_normalizes_tool_output_before_action_log(monkeypatch: pytest.MonkeyPatch):
+    started = datetime.now(UTC)
+    output_time = datetime.now(UTC)
+    job = BackgroundJob(
+        job_id=600,
+        task_type="agent.execute",
+        status="running",
+        payload={
+            "planJobId": "500",
+            "planHash": "sha256:test",
+            "approval": {
+                "confirmedBy": "7",
+                "confirmedAt": started.isoformat(),
+                "highRiskConfirmed": False,
+            },
+        },
+        result={},
+        requested_by=7,
+        scheduled_at=started,
+        created_at=started,
+        updated_at=started,
+    )
+    action = {
+        "step": 1,
+        "tool": "drive.createFolder",
+        "input": {"parentFolderId": "root", "name": "Movies"},
+        "sideEffect": "write",
+        "riskLevel": "low",
+        "requiresConfirmation": False,
+    }
+    db = DummyDb()
+    db.refresh = AsyncMock()
+
+    mock_plan_repo = SimpleNamespace(
+        get_for_execute_binding=AsyncMock(
+            return_value=SimpleNamespace(
+                proposed_actions_json=[action],
+            )
+        )
+    )
+    monkeypatch.setattr(execute_module, "AgentPlanRepository", lambda _db: mock_plan_repo)
+
+    mock_work_sessions = SimpleNamespace(
+        create_for_job=AsyncMock(return_value=None),
+        close_session=AsyncMock(return_value=None),
+    )
+    monkeypatch.setattr(execute_module, "AgentWorkSessionRepository", lambda _db: mock_work_sessions)
+
+    captured_outputs: list[dict[str, object]] = []
+    mock_action_logs = SimpleNamespace(
+        append_step=AsyncMock(return_value=None),
+        finish_step=AsyncMock(
+            side_effect=lambda **kwargs: captured_outputs.append(dict(kwargs)) or None
+        ),
+    )
+    monkeypatch.setattr(execute_module, "AgentActionLogRepository", lambda _db: mock_action_logs)
+
+    mock_router = SimpleNamespace(
+        dispatch=AsyncMock(
+            return_value={
+                "id": "9",
+                "createdAt": output_time,
+                "updatedAt": output_time,
+            }
+        )
+    )
+    monkeypatch.setattr(execute_module, "ToolRouter", lambda **kwargs: mock_router)
+
+    result = await ExecuteRunner(
+        answer_client=SimpleNamespace(create_answer=AsyncMock(return_value="ok"))  # type: ignore[arg-type]
+    ).run(db=db, job=job)  # type: ignore[arg-type]
+
+    assert result.applied_actions == 1
+    assert captured_outputs
+    success_call = next(item for item in captured_outputs if item.get("status") == "succeeded")
+    outputs_json = success_call["outputs_json"]
+    assert isinstance(outputs_json, dict)
+    assert isinstance(outputs_json["createdAt"], str)
+    assert outputs_json["createdAt"] == output_time.isoformat()
+
+
+@pytest.mark.asyncio
+async def test_execute_runner_propagates_answer_model_errors(monkeypatch: pytest.MonkeyPatch):
+    started = datetime.now(UTC)
+    job = BackgroundJob(
+        job_id=610,
+        task_type="agent.execute",
+        status="running",
+        payload={
+            "planJobId": "510",
+            "planHash": "sha256:test",
+            "approval": {
+                "confirmedBy": "7",
+                "confirmedAt": started.isoformat(),
+                "highRiskConfirmed": False,
+            },
+        },
+        result={},
+        requested_by=7,
+        scheduled_at=started,
+        created_at=started,
+        updated_at=started,
+    )
+    action = {
+        "step": 1,
+        "tool": "drive.countFiles",
+        "input": {"folderId": "root", "recursive": True, "category": "video"},
+        "sideEffect": "read",
+        "riskLevel": "low",
+        "requiresConfirmation": False,
+    }
+    db = DummyDb()
+    db.refresh = AsyncMock()
+    monkeypatch.setattr(
+        execute_module,
+        "AgentPlanRepository",
+        lambda _db: SimpleNamespace(
+            get_for_execute_binding=AsyncMock(return_value=SimpleNamespace(proposed_actions_json=[action]))
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentWorkSessionRepository",
+        lambda _db: SimpleNamespace(
+            create_for_job=AsyncMock(return_value=None),
+            close_session=AsyncMock(return_value=None),
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentActionLogRepository",
+        lambda _db: SimpleNamespace(
+            append_step=AsyncMock(return_value=None),
+            finish_step=AsyncMock(return_value=None),
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "ToolRouter",
+        lambda **kwargs: SimpleNamespace(
+            dispatch=AsyncMock(
+                return_value={
+                    "totalItems": 3,
+                    "category": "video",
+                    "recursive": True,
+                    "folderId": "1",
+                    "byMimeType": {"video/mp4": 3},
+                }
+            )
+        ),
+    )
+
+    with pytest.raises(ApiError) as exc:
+        await ExecuteRunner(
+            answer_client=SimpleNamespace(
+                create_answer=AsyncMock(
+                    side_effect=ApiError(status_code=503, code=503, message="Agent LLM API key is not configured")
+                )
+            )  # type: ignore[arg-type]
+        ).run(db=db, job=job)  # type: ignore[arg-type]
+
+    assert exc.value.status_code == 503
+
+
+@pytest.mark.asyncio
+async def test_execute_runner_returns_count_files_answer(monkeypatch: pytest.MonkeyPatch):
+    started = datetime.now(UTC)
+    job = BackgroundJob(
+        job_id=601,
+        task_type="agent.execute",
+        status="running",
+        payload={
+            "planJobId": "501",
+            "planHash": "sha256:test",
+            "approval": {
+                "confirmedBy": "7",
+                "confirmedAt": started.isoformat(),
+                "highRiskConfirmed": False,
+            },
+        },
+        result={},
+        requested_by=7,
+        scheduled_at=started,
+        created_at=started,
+        updated_at=started,
+    )
+    action = {
+        "step": 1,
+        "tool": "drive.countFiles",
+        "input": {"folderId": "root", "recursive": True, "category": "video"},
+        "sideEffect": "read",
+        "riskLevel": "low",
+        "requiresConfirmation": False,
+    }
+    db = DummyDb()
+    db.refresh = AsyncMock()
+
+    mock_plan_repo = SimpleNamespace(
+        get_for_execute_binding=AsyncMock(
+            return_value=SimpleNamespace(
+                proposed_actions_json=[action],
+            )
+        )
+    )
+    monkeypatch.setattr(execute_module, "AgentPlanRepository", lambda _db: mock_plan_repo)
+
+    mock_work_sessions = SimpleNamespace(
+        create_for_job=AsyncMock(return_value=None),
+        close_session=AsyncMock(return_value=None),
+    )
+    monkeypatch.setattr(execute_module, "AgentWorkSessionRepository", lambda _db: mock_work_sessions)
+    monkeypatch.setattr(
+        execute_module,
+        "AgentActionLogRepository",
+        lambda _db: SimpleNamespace(
+            append_step=AsyncMock(return_value=None),
+            finish_step=AsyncMock(return_value=None),
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "ToolRouter",
+        lambda **kwargs: SimpleNamespace(
+            dispatch=AsyncMock(
+                return_value={
+                    "totalItems": 3,
+                    "category": "video",
+                    "recursive": True,
+                    "folderId": "1",
+                    "byMimeType": {"video/mp4": 3},
+                    "sampleItems": [],
+                }
+            )
+        ),
+    )
+
+    result = await ExecuteRunner(
+        answer_client=SimpleNamespace(
+            create_answer=AsyncMock(return_value="你上传了 3 部电影（按视频文件统计）。")
+        )  # type: ignore[arg-type]
+    ).run(db=db, job=job)  # type: ignore[arg-type]
+
+    assert result.answer == "你上传了 3 部电影（按视频文件统计）。"
+    assert result.applied_actions == 1
+
+
+@pytest.mark.asyncio
+async def test_execute_runner_returns_count_files_answer_with_search_term(
+    monkeypatch: pytest.MonkeyPatch,
+):
+    started = datetime.now(UTC)
+    job = BackgroundJob(
+        job_id=602,
+        task_type="agent.execute",
+        status="running",
+        payload={
+            "planJobId": "502",
+            "planHash": "sha256:test",
+            "approval": {
+                "confirmedBy": "7",
+                "confirmedAt": started.isoformat(),
+                "highRiskConfirmed": False,
+            },
+        },
+        result={},
+        requested_by=7,
+        scheduled_at=started,
+        created_at=started,
+        updated_at=started,
+    )
+    action = {
+        "step": 1,
+        "tool": "drive.countFiles",
+        "input": {
+            "folderId": "root",
+            "recursive": True,
+            "category": "video",
+            "search": "银翼杀手",
+        },
+        "sideEffect": "read",
+        "riskLevel": "low",
+        "requiresConfirmation": False,
+    }
+    db = DummyDb()
+    db.refresh = AsyncMock()
+
+    monkeypatch.setattr(
+        execute_module,
+        "AgentPlanRepository",
+        lambda _db: SimpleNamespace(
+            get_for_execute_binding=AsyncMock(
+                return_value=SimpleNamespace(proposed_actions_json=[action])
+            )
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentWorkSessionRepository",
+        lambda _db: SimpleNamespace(
+            create_for_job=AsyncMock(return_value=None),
+            close_session=AsyncMock(return_value=None),
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentActionLogRepository",
+        lambda _db: SimpleNamespace(
+            append_step=AsyncMock(return_value=None),
+            finish_step=AsyncMock(return_value=None),
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "ToolRouter",
+        lambda **kwargs: SimpleNamespace(
+            dispatch=AsyncMock(
+                return_value={
+                    "totalItems": 2,
+                    "category": "video",
+                    "recursive": True,
+                    "folderId": "1",
+                    "search": "银翼杀手",
+                    "byMimeType": {"video/mp4": 2},
+                    "sampleItems": [],
+                }
+            )
+        ),
+    )
+
+    result = await ExecuteRunner(
+        answer_client=SimpleNamespace(
+            create_answer=AsyncMock(return_value="你上传了 2 部名称包含“银翼杀手”的电影（按视频文件统计）。")
+        )  # type: ignore[arg-type]
+    ).run(db=db, job=job)  # type: ignore[arg-type]
+
+    assert result.answer == "你上传了 2 部名称包含“银翼杀手”的电影（按视频文件统计）。"
+    assert "只读操作" not in (result.answer or "")
+
+
+@pytest.mark.asyncio
+async def test_execute_runner_returns_count_files_answer_with_names_when_asked(
+    monkeypatch: pytest.MonkeyPatch,
+):
+    started = datetime.now(UTC)
+    job = BackgroundJob(
+        job_id=604,
+        task_type="agent.execute",
+        status="running",
+        payload={
+            "planJobId": "504",
+            "planHash": "sha256:test",
+            "approval": {
+                "confirmedBy": "7",
+                "confirmedAt": started.isoformat(),
+                "highRiskConfirmed": False,
+            },
+        },
+        result={},
+        requested_by=7,
+        scheduled_at=started,
+        created_at=started,
+        updated_at=started,
+    )
+    action = {
+        "step": 1,
+        "tool": "drive.countFiles",
+        "input": {"folderId": "root", "recursive": True, "category": "archive"},
+        "sideEffect": "read",
+        "riskLevel": "low",
+        "requiresConfirmation": False,
+    }
+    db = DummyDb()
+    db.refresh = AsyncMock()
+
+    monkeypatch.setattr(
+        execute_module,
+        "AgentPlanRepository",
+        lambda _db: SimpleNamespace(
+            get_for_execute_binding=AsyncMock(
+                return_value=SimpleNamespace(
+                    input_text="我上传了多少压缩包，叫什么名字",
+                    proposed_actions_json=[action],
+                )
+            )
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentWorkSessionRepository",
+        lambda _db: SimpleNamespace(
+            create_for_job=AsyncMock(return_value=None),
+            close_session=AsyncMock(return_value=None),
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentActionLogRepository",
+        lambda _db: SimpleNamespace(
+            append_step=AsyncMock(return_value=None),
+            finish_step=AsyncMock(return_value=None),
+        ),
+    )
+    monkeypatch.setattr(
+        execute_module,
+        "ToolRouter",
+        lambda **kwargs: SimpleNamespace(
+            dispatch=AsyncMock(
+                return_value={
+                    "totalItems": 2,
+                    "category": "archive",
+                    "recursive": True,
+                    "folderId": "1",
+                    "itemNames": ["photos.zip", "backup.7z"],
+                    "itemNamesTruncated": False,
+                    "byMimeType": {"application/zip": 1, "application/x-7z-compressed": 1},
+                    "sampleItems": [],
+                }
+            )
+        ),
+    )
 
-def test_execute_reference_resolution_rejects_symbolic_placeholder():
-    with pytest.raises(ApiError) as exc:
-        execute_module._resolve_references(
-            {"targetFolderId": "newFolderId"},
-            step_outputs={},
-        )
+    result = await ExecuteRunner(
+        answer_client=SimpleNamespace(
+            create_answer=AsyncMock(return_value="你上传了 2 个压缩包，名字是：photos.zip、backup.7z。")
+        )  # type: ignore[arg-type]
+    ).run(db=db, job=job)  # type: ignore[arg-type]
 
-    assert exc.value.status_code == 409
-    assert "targetFolderId" in exc.value.message
-    assert "$stepN.field" in exc.value.message
+    assert result.answer == "你上传了 2 个压缩包，名字是：photos.zip、backup.7z。"
 
 
 @pytest.mark.asyncio
-async def test_policy_guard_blocks_delete_without_confirmation():
-    decision = await PolicyGuard().evaluate_tool_call(
-        tool_name="drive.deleteFile",
-        high_risk_confirmed=False,
+async def test_execute_runner_lists_archive_names_for_read_only_archive_question(
+    monkeypatch: pytest.MonkeyPatch,
+):
+    started = datetime.now(UTC)
+    job = BackgroundJob(
+        job_id=603,
+        task_type="agent.execute",
+        status="running",
+        payload={
+            "planJobId": "503",
+            "planHash": "sha256:test",
+            "approval": {
+                "confirmedBy": "7",
+                "confirmedAt": started.isoformat(),
+                "highRiskConfirmed": False,
+            },
+        },
+        result={},
+        requested_by=7,
+        scheduled_at=started,
+        created_at=started,
+        updated_at=started,
     )
-    assert decision.allowed is False
-    assert classify_tool_risk("drive.deleteFolder") == "high"
-
+    action = {
+        "step": 1,
+        "tool": "drive.listFolder",
+        "input": {"folderId": "root"},
+        "sideEffect": "read",
+        "riskLevel": "low",
+        "requiresConfirmation": False,
+    }
+    db = DummyDb()
+    db.refresh = AsyncMock()
 
-@pytest.mark.asyncio
-async def test_tool_router_dispatches_move_file():
-    router = ToolRouter(db=DummyDb(), user_id=7)  # type: ignore[arg-type]
-    router.file_service.move_file = AsyncMock(
-        return_value=SimpleNamespace(
-            model_dump=lambda **kwargs: {"fileId": "1", "targetFolderId": "2"}
-        )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentPlanRepository",
+        lambda _db: SimpleNamespace(
+            get_for_execute_binding=AsyncMock(
+                return_value=SimpleNamespace(
+                    input_text="我上传了哪些压缩包",
+                    proposed_actions_json=[action],
+                )
+            )
+        ),
     )
-
-    result = await router.dispatch(
-        ToolCall(
-            tool_name="drive.moveFile",
-            arguments={"fileId": "1", "targetFolderId": "2"},
-        )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentWorkSessionRepository",
+        lambda _db: SimpleNamespace(
+            create_for_job=AsyncMock(return_value=None),
+            close_session=AsyncMock(return_value=None),
+        ),
     )
-
-    assert result == {"fileId": "1", "targetFolderId": "2"}
-    router.file_service.move_file.assert_awaited_once()
-
-
-@pytest.mark.asyncio
-async def test_tool_router_count_files_counts_recursive_videos():
-    db = DummyDb()
-    db.scalar = AsyncMock(return_value=1)
-    db.scalars = AsyncMock(return_value=[1, 2])
-    db.execute = AsyncMock(
-        return_value=SimpleNamespace(
-            all=lambda: [
-                (10, "movie.mp4", 100, "application/octet-stream", "mp4", 1),
-                (11, "clip.mkv", 200, "video/x-matroska", "mkv", 2),
-                (12, "notes.txt", 10, "text/plain", "txt", 1),
-            ]
-        )
+    monkeypatch.setattr(
+        execute_module,
+        "AgentActionLogRepository",
+        lambda _db: SimpleNamespace(
+            append_step=AsyncMock(return_value=None),
+            finish_step=AsyncMock(return_value=None),
+        ),
     )
-    router = ToolRouter(db=db, user_id=7)  # type: ignore[arg-type]
-
-    result = await router.dispatch(
-        ToolCall(
-            tool_name="drive.countFiles",
-            arguments={"folderId": "root", "recursive": True, "category": "video"},
-        )
+    monkeypatch.setattr(
+        execute_module,
+        "ToolRouter",
+        lambda **kwargs: SimpleNamespace(
+            dispatch=AsyncMock(
+                return_value={
+                    "items": [
+                        {
+                            "itemType": "file",
+                            "id": "1",
+                            "name": "photos.zip",
+                            "size": 10,
+                            "mimeType": "application/zip",
+                        },
+                        {
+                            "itemType": "file",
+                            "id": "2",
+                            "name": "movie.mp4",
+                            "size": 20,
+                            "mimeType": "video/mp4",
+                        },
+                        {
+                            "itemType": "file",
+                            "id": "3",
+                            "name": "backup.7z",
+                            "size": 30,
+                            "mimeType": "application/octet-stream",
+                        },
+                    ],
+                    "pagination": {
+                        "totalItems": 3,
+                        "totalPages": 1,
+                        "perPage": 200,
+                        "currentPage": 1,
+                        "hasPrev": False,
+                        "hasNext": False,
+                    },
+                }
+            )
+        ),
     )
 
-    assert result["totalItems"] == 2
-    assert result["category"] == "video"
-    assert result["recursive"] is True
-    assert result["byMimeType"] == {"video/mp4": 1, "video/x-matroska": 1}
-    assert [item["name"] for item in result["sampleItems"]] == ["movie.mp4", "clip.mkv"]
-    executed_statement = str(db.execute.await_args.args[0])
-    assert "file.status" in executed_statement
-    assert "file.is_latest" in executed_statement
+    result = await ExecuteRunner(
+        answer_client=SimpleNamespace(
+            create_answer=AsyncMock(return_value="当前文件夹中的压缩包有 2 个：photos.zip、backup.7z。")
+        )  # type: ignore[arg-type]
+    ).run(db=db, job=job)  # type: ignore[arg-type]
+
+    assert result.answer == "当前文件夹中的压缩包有 2 个：photos.zip、backup.7z。"
 
 
 @pytest.mark.asyncio
-async def test_execute_runner_normalizes_tool_output_before_action_log(monkeypatch: pytest.MonkeyPatch):
+async def test_execute_runner_returns_search_files_candidate_answer(
+    monkeypatch: pytest.MonkeyPatch,
+):
     started = datetime.now(UTC)
-    output_time = datetime.now(UTC)
     job = BackgroundJob(
-        job_id=600,
+        job_id=605,
         task_type="agent.execute",
         status="running",
         payload={
-            "planJobId": "500",
+            "planJobId": "505",
             "planHash": "sha256:test",
             "approval": {
                 "confirmedBy": "7",
@@ -862,70 +2285,102 @@ async def test_execute_runner_normalizes_tool_output_before_action_log(monkeypat
     )
     action = {
         "step": 1,
-        "tool": "drive.createFolder",
-        "input": {"parentFolderId": "root", "name": "Movies"},
-        "sideEffect": "write",
+        "tool": "drive.searchFiles",
+        "input": {"folderId": "root", "query": "银翼杀手", "category": "video"},
+        "sideEffect": "read",
         "riskLevel": "low",
         "requiresConfirmation": False,
     }
     db = DummyDb()
     db.refresh = AsyncMock()
 
-    mock_plan_repo = SimpleNamespace(
-        get_for_execute_binding=AsyncMock(
-            return_value=SimpleNamespace(
-                proposed_actions_json=[action],
+    monkeypatch.setattr(
+        execute_module,
+        "AgentPlanRepository",
+        lambda _db: SimpleNamespace(
+            get_for_execute_binding=AsyncMock(
+                return_value=SimpleNamespace(
+                    input_text="把银翼杀手电影放到银翼杀手文件夹下",
+                    proposed_actions_json=[action],
+                )
             )
-        )
+        ),
     )
-    monkeypatch.setattr(execute_module, "AgentPlanRepository", lambda _db: mock_plan_repo)
-
-    mock_work_sessions = SimpleNamespace(
-        create_for_job=AsyncMock(return_value=None),
-        close_session=AsyncMock(return_value=None),
+    monkeypatch.setattr(
+        execute_module,
+        "AgentWorkSessionRepository",
+        lambda _db: SimpleNamespace(
+            create_for_job=AsyncMock(return_value=None),
+            close_session=AsyncMock(return_value=None),
+        ),
     )
-    monkeypatch.setattr(execute_module, "AgentWorkSessionRepository", lambda _db: mock_work_sessions)
-
-    captured_outputs: list[dict[str, object]] = []
-    mock_action_logs = SimpleNamespace(
-        append_step=AsyncMock(return_value=None),
-        finish_step=AsyncMock(
-            side_effect=lambda **kwargs: captured_outputs.append(dict(kwargs)) or None
+    monkeypatch.setattr(
+        execute_module,
+        "AgentActionLogRepository",
+        lambda _db: SimpleNamespace(
+            append_step=AsyncMock(return_value=None),
+            finish_step=AsyncMock(return_value=None),
         ),
     )
-    monkeypatch.setattr(execute_module, "AgentActionLogRepository", lambda _db: mock_action_logs)
-
-    mock_router = SimpleNamespace(
-        dispatch=AsyncMock(
-            return_value={
-                "id": "9",
-                "createdAt": output_time,
-                "updatedAt": output_time,
-            }
-        )
+    monkeypatch.setattr(
+        execute_module,
+        "ToolRouter",
+        lambda **kwargs: SimpleNamespace(
+            dispatch=AsyncMock(
+                return_value={
+                    "items": [
+                        {"id": "11", "name": "银翼杀手1982.mp4", "mimeType": "video/mp4"},
+                        {"id": "12", "name": "银翼杀手2049.mp4", "mimeType": "video/mp4"},
+                    ],
+                    "totalItems": 2,
+                    "query": "银翼杀手",
+                    "folderId": "1",
+                    "recursive": False,
+                    "category": "video",
+                }
+            )
+        ),
     )
-    monkeypatch.setattr(execute_module, "ToolRouter", lambda **kwargs: mock_router)
 
-    result = await ExecuteRunner().run(db=db, job=job)  # type: ignore[arg-type]
+    result = await ExecuteRunner(
+        answer_client=SimpleNamespace(
+            create_answer=AsyncMock(
+                return_value="找到 2 个名称包含“银翼杀手”的文件：银翼杀手1982.mp4、银翼杀手2049.mp4。"
+            )
+        )  # type: ignore[arg-type]
+    ).run(db=db, job=job)  # type: ignore[arg-type]
 
-    assert result.applied_actions == 1
-    assert captured_outputs
-    success_call = next(item for item in captured_outputs if item.get("status") == "succeeded")
-    outputs_json = success_call["outputs_json"]
-    assert isinstance(outputs_json, dict)
-    assert isinstance(outputs_json["createdAt"], str)
-    assert outputs_json["createdAt"] == output_time.isoformat()
+    assert result.answer == "找到 2 个名称包含“银翼杀手”的文件：银翼杀手1982.mp4、银翼杀手2049.mp4。"
 
 
-@pytest.mark.asyncio
-async def test_execute_runner_returns_count_files_answer(monkeypatch: pytest.MonkeyPatch):
+class _NeverStream:  # Stream stub whose next() never produces an event.
+    async def next(self, *, timeout=None):  # noqa: ANN001
+        await asyncio.Future()  # fresh Future that nobody completes: this await stays pending
+
+    async def aclose(self) -> None:
+        return None  # nothing to release
+
+
+class _CaptureBus:  # Event-bus double that records every published envelope.
+    def __init__(self) -> None:
+        self.events: list[AgentEventEnvelope] = []  # envelopes in publish order
+
+    async def publish(self, envelope: AgentEventEnvelope) -> None:
+        self.events.append(envelope)  # record only; nothing is delivered to subscribers
+
+    @asynccontextmanager
+    async def subscribe(self, *, job_id: int):  # noqa: ARG002
+        yield _NeverStream()  # subscribers get a stream that never yields an event
+
+
+def _execute_job_for_controls() -> BackgroundJob:
     started = datetime.now(UTC)
-    job = BackgroundJob(
-        job_id=601,
+    return BackgroundJob(
+        job_id=700,
         task_type="agent.execute",
         status="running",
         payload={
-            "planJobId": "501",
+            "planJobId": "500",
             "planHash": "sha256:test",
             "approval": {
                 "confirmedBy": "7",
@@ -939,6 +2394,14 @@ async def test_execute_runner_returns_count_files_answer(monkeypatch: pytest.Mon
         created_at=started,
         updated_at=started,
     )
+
+
+def _patch_execute_dependencies(
+    monkeypatch: pytest.MonkeyPatch,
+    *,
+    controls: list[list[SimpleNamespace]],
+    dropped: list[int],
+) -> None:
     action = {
         "step": 1,
         "tool": "drive.countFiles",
@@ -947,23 +2410,24 @@ async def test_execute_runner_returns_count_files_answer(monkeypatch: pytest.Mon
         "riskLevel": "low",
         "requiresConfirmation": False,
     }
-    db = DummyDb()
-    db.refresh = AsyncMock()
 
-    mock_plan_repo = SimpleNamespace(
-        get_for_execute_binding=AsyncMock(
-            return_value=SimpleNamespace(
-                proposed_actions_json=[action],
+    monkeypatch.setattr(
+        execute_module,
+        "AgentPlanRepository",
+        lambda _db: SimpleNamespace(
+            get_for_execute_binding=AsyncMock(
+                return_value=SimpleNamespace(proposed_actions_json=[action])
             )
-        )
+        ),
     )
-    monkeypatch.setattr(execute_module, "AgentPlanRepository", lambda _db: mock_plan_repo)
-
-    mock_work_sessions = SimpleNamespace(
-        create_for_job=AsyncMock(return_value=None),
-        close_session=AsyncMock(return_value=None),
+    monkeypatch.setattr(
+        execute_module,
+        "AgentWorkSessionRepository",
+        lambda _db: SimpleNamespace(
+            create_for_job=AsyncMock(return_value=None),
+            close_session=AsyncMock(return_value=None),
+        ),
     )
-    monkeypatch.setattr(execute_module, "AgentWorkSessionRepository", lambda _db: mock_work_sessions)
     monkeypatch.setattr(
         execute_module,
         "AgentActionLogRepository",
@@ -978,18 +2442,103 @@ async def test_execute_runner_returns_count_files_answer(monkeypatch: pytest.Mon
         lambda **kwargs: SimpleNamespace(
             dispatch=AsyncMock(
                 return_value={
-                    "totalItems": 3,
+                    "totalItems": 1,
                     "category": "video",
                     "recursive": True,
                     "folderId": "1",
-                    "byMimeType": {"video/mp4": 3},
+                    "byMimeType": {"video/mp4": 1},
                     "sampleItems": [],
                 }
             )
         ),
     )
 
-    result = await ExecuteRunner().run(db=db, job=job)  # type: ignore[arg-type]
+    class FakeInboxRepository:  # Inbox double scripted by the enclosing function's controls/dropped lists.
+        def __init__(self, _db) -> None:  # noqa: ANN001
+            return None  # the db handle is ignored
+
+        async def list_pending_controls(self, *, job_id: int):  # noqa: ARG002
+            if controls:
+                return controls.pop(0)  # hand out one scripted batch per call, first batch first
+            return []  # script exhausted: no pending controls
+
+        async def mark_dropped(self, *, inbox_message_id: int) -> None:
+            dropped.append(inbox_message_id)  # record the id so the caller can assert on it
+
+    monkeypatch.setattr(execute_module, "AgentInboxMessageRepository", FakeInboxRepository)
+
+
+@pytest.mark.asyncio  # Scenario: a pause control, then a resume control; the single step must still run.
+async def test_execute_runner_pauses_then_resumes_at_step_boundary(
+    monkeypatch: pytest.MonkeyPatch,
+):
+    controls = [  # one batch per list_pending_controls() call of the fake inbox: pause, then resume
+        [SimpleNamespace(inbox_message_id=1, kind=AgentInboxKind.CONTROL_PAUSE)],
+        [SimpleNamespace(inbox_message_id=2, kind=AgentInboxKind.CONTROL_RESUME)],
+    ]
+    dropped: list[int] = []  # filled by the fake inbox's mark_dropped()
+    _patch_execute_dependencies(monkeypatch, controls=controls, dropped=dropped)
+    db = DummyDb()
+    db.refresh = AsyncMock()
+    bus = _CaptureBus()  # captures published events for the assertions below
+
+    result = await ExecuteRunner(
+        event_bus=bus,
+        answer_client=SimpleNamespace(create_answer=AsyncMock(return_value="ok")),  # type: ignore[arg-type]
+    ).run(db=db, job=_execute_job_for_controls())  # type: ignore[arg-type]
 
-    assert result.answer == "你上传了 3 部电影（按视频文件统计）。"
     assert result.applied_actions == 1
+    assert dropped == [1, 2]  # both control messages were marked dropped, in order
+    event_types = [event.event_type for event in bus.events]
+    assert "agent.paused" in event_types
+    assert "agent.resumed" in event_types
+    assert "tool.started" in event_types  # the tool step ran despite the pause
+    assert "tool.succeeded" in event_types
+
+
+@pytest.mark.asyncio  # Scenario: a cancel control from the inbox aborts the run with AgentJobCanceled.
+async def test_execute_runner_canceled_via_inbox_at_step_boundary(
+    monkeypatch: pytest.MonkeyPatch,
+):
+    controls = [[SimpleNamespace(inbox_message_id=1, kind=AgentInboxKind.CONTROL_CANCEL)]]  # single batch
+    dropped: list[int] = []  # filled by the fake inbox's mark_dropped()
+    _patch_execute_dependencies(monkeypatch, controls=controls, dropped=dropped)
+    db = DummyDb()
+    db.refresh = AsyncMock()
+
+    with pytest.raises(AgentJobCanceled):
+        await ExecuteRunner(
+            event_bus=_CaptureBus(),
+            answer_client=SimpleNamespace(create_answer=AsyncMock(return_value="ok")),  # type: ignore[arg-type]
+        ).run(  # type: ignore[arg-type]
+            db=db,
+            job=_execute_job_for_controls(),
+        )
+
+    assert dropped == [1]  # the cancel message itself was marked dropped
+
+
+@pytest.mark.asyncio  # _publish_state must swallow errors raised by the event bus.
+async def test_execute_runner_publish_state_ignores_event_bus_failures():
+    bus = SimpleNamespace(publish=AsyncMock(side_effect=RuntimeError("boom")))  # every publish raises
+    runner = ExecuteRunner(event_bus=bus)  # type: ignore[arg-type]
+
+    await runner._publish_state("agent.paused", job_id=1)  # passes only if the RuntimeError does not escape
+
+    assert bus.publish.await_count == 1  # publish was attempted exactly once
+
+
+@pytest.mark.asyncio  # _publish_tool must swallow errors raised by the event bus.
+async def test_execute_runner_publish_tool_ignores_event_bus_failures():
+    bus = SimpleNamespace(publish=AsyncMock(side_effect=RuntimeError("boom")))  # every publish raises
+    runner = ExecuteRunner(event_bus=bus)  # type: ignore[arg-type]
+
+    await runner._publish_tool(  # passes only if the RuntimeError does not escape
+        "tool.started",
+        job_id=1,
+        step=1,
+        tool="drive.listFolder",
+        payload={"input": {"folderId": "root"}},
+    )
+
+    assert bus.publish.await_count == 1  # publish was attempted exactly once
diff --git a/app/tests/test_agent_routes.py b/app/tests/test_agent_routes.py
index 6b50f90..68d225e 100644
--- a/app/tests/test_agent_routes.py
+++ b/app/tests/test_agent_routes.py
@@ -1,14 +1,22 @@
 from __future__ import annotations
 
+from contextlib import asynccontextmanager
 from datetime import UTC, datetime
 
 from fastapi import FastAPI
 from fastapi.testclient import TestClient
 
-from fileflash.core.deps import get_agent_execute_service, get_agent_plan_service, get_current_user
+from fileflash.agents.harness.event_bus import AgentEventEnvelope, InMemoryAgentEventBus
+from fileflash.core.deps import (
+    get_agent_event_bus,
+    get_agent_execute_service,
+    get_agent_plan_service,
+    get_current_user,
+)
 from fileflash.core.errors import ApiError, api_error_handler
 from fileflash.db.deps import get_db
-from fileflash.models import BackgroundJob
+from fileflash.models import AgentActionLog, AgentInboxMessage, BackgroundJob
+from fileflash.models.enums import AgentInboxRole
 from fileflash.models.tables_identity import User
 from fileflash.routers.agent import router
 from fileflash.schemas.agent import ExecuteAgentResponse, PlanAgentResponse
@@ -38,16 +46,32 @@ def __init__(self) -> None:
             created_at=now,
             updated_at=now,
         )
+        self.messages: list[AgentInboxMessage] = []
+        self._next_inbox_id = 1
 
     async def scalar(self, _query):  # noqa: ANN001
         return self.job
 
+    async def scalars(self, _query):  # noqa: ANN001
+        return []  # stub: the query is ignored and no rows are returned
+
+    def add(self, msg: AgentInboxMessage) -> None:
+        msg.inbox_message_id = self._next_inbox_id  # assign the next sequential stub id
+        self._next_inbox_id += 1
+        self.messages.append(msg)  # keep the message so tests can inspect it
+
+    async def flush(self) -> None:
+        return None  # no-op in this stub
+
     async def commit(self) -> None:
         return None
 
     async def refresh(self, _job: BackgroundJob) -> None:
         return None
 
+    async def get(self, _model, _id: int):  # noqa: ANN001
+        return None  # stub: both arguments are ignored and no row is ever returned
+
 
 class RunningJobDb(StubDb):
     def __init__(self) -> None:
@@ -55,6 +79,40 @@ def __init__(self) -> None:
         self.job.status = "running"
 
 
+class EventsDb(StubDb):  # StubDb variant: a succeeded job with a result dict plus one action-log row.
+    def __init__(self) -> None:
+        super().__init__()
+        now = datetime.now(UTC)  # single timestamp reused for every time field below
+        self.job.status = "succeeded"
+        self.job.result = {
+            "planJobId": "10",
+            "executeJobId": "12",
+            "summary": "done",
+            "answer": "你上传了 2 部名称包含“银翼杀手”的电影（按视频文件统计）。",
+            "appliedActions": 1,
+            "skippedActions": 0,
+            "warnings": [],
+            "finishedAt": now.isoformat(),
+        }
+        self.job.finished_at = now
+        self.job.updated_at = now
+        self.action_log = AgentActionLog(  # the one row returned by scalars() below
+            action_log_id=1,
+            job_id=12,
+            step_no=1,
+            tool_name="drive.countFiles",
+            inputs_json={"folderId": "root", "category": "video", "search": "银翼杀手"},
+            outputs_json={"totalItems": 2, "category": "video", "search": "银翼杀手"},
+            status="succeeded",
+            duration_ms=12,
+            started_at=now,
+            finished_at=now,
+        )
+
+    async def scalars(self, _query):  # noqa: ANN001
+        return [self.action_log]  # the query is ignored; always the single action-log row
+
+
 def _user() -> User:
     return User(user_id=7, username="u7", email="u7@example.com", password_hash="x")
 
@@ -81,6 +139,17 @@ def _client_with_running_job() -> TestClient:
     return TestClient(app)
 
 
+def _client_with_events() -> TestClient:  # Test client whose get_db dependency yields an EventsDb.
+    app = FastAPI()
+    app.include_router(router, prefix="/api/v1")
+    app.add_exception_handler(ApiError, api_error_handler)
+    app.dependency_overrides[get_current_user] = _user
+    app.dependency_overrides[get_agent_plan_service] = lambda: StubPlanService()
+    app.dependency_overrides[get_agent_execute_service] = lambda: StubExecuteService()
+    app.dependency_overrides[get_db] = lambda: EventsDb()  # a new EventsDb each time the override is called
+    return TestClient(app)
+
+
 def test_plan_route_returns_response_shell():
     response = _client().post(
         "/api/v1/agent/plan",
@@ -131,22 +200,85 @@ def test_execute_route_returns_response_shell():
     assert body["data"]["taskType"] == "agent.execute"
 
 
-def test_cancel_route_returns_response_shell():
-    response = _client().post("/api/v1/agent/cancel/12")
+def test_post_message_control_pause_returns_response_shell():  # POST control.pause to the job's messages route.
+    bus = InMemoryAgentEventBus()
+    db = StubDb()  # one shared instance so db.messages can be inspected after the request
+    app = FastAPI()
+    app.include_router(router, prefix="/api/v1")
+    app.add_exception_handler(ApiError, api_error_handler)
+    app.dependency_overrides[get_current_user] = _user
+    app.dependency_overrides[get_db] = lambda: db  # always the same StubDb
+    app.dependency_overrides[get_agent_event_bus] = lambda: bus
+    client = TestClient(app)
+
+    response = client.post("/api/v1/agent/jobs/12/messages", json={"kind": "control.pause"})
 
     assert response.status_code == 200
     body = response.json()
     assert body["success"] is True
-    assert body["data"]["jobId"] == "12"
-    assert body["data"]["status"] == "canceled"
-    assert body["data"]["canceledAt"]
+    assert body["data"]["kind"] == "control.pause"
+    assert body["data"]["inboxMessageId"] == "1"  # StubDb.add starts ids at 1; the response carries it as a string
+    assert db.messages[0].role == AgentInboxRole.USER  # the stored message is attributed to the user role
 
 
-def test_cancel_route_marks_running_job_as_canceled():
-    response = _client_with_running_job().post("/api/v1/agent/cancel/12")
+def test_job_events_route_streams_tool_and_final_answer_events():  # Events route backed by EventsDb.
+    response = _client_with_events().get("/api/v1/agent/jobs/12/events")
 
     assert response.status_code == 200
-    body = response.json()
-    assert body["success"] is True
-    assert body["data"]["jobId"] == "12"
-    assert body["data"]["status"] == "canceled"
+    assert response.headers["content-type"].startswith("text/event-stream")  # served as an event stream
+    body = response.text  # raw stream text; checked with substring assertions below
+    assert "event: tool.started" in body
+    assert "event: tool.succeeded" in body
+    assert "event: job.succeeded" in body
+    assert "正在读取名称包含" in body
+    assert "银翼杀手" in body  # the search term from EventsDb's action log / answer
+    assert "answer" in body
+
+
+def test_job_events_route_streams_event_bus_events_after_initial_replay():  # Bus-delivered events reach the response.
+    now = datetime.now(UTC)
+    events = [  # scripted envelopes; StaticStream.next() hands them out in order
+        AgentEventEnvelope(
+            job_id=12,
+            event_type="agent.progress",
+            payload={"step": 1, "total": 3, "message": "halfway"},
+            emitted_at=now,
+        ),
+        AgentEventEnvelope(
+            job_id=12,
+            event_type="job.succeeded",
+            payload={"status": "succeeded"},
+            emitted_at=now,
+        ),
+    ]
+
+    class StaticStream:  # stream double that replays the scripted events list
+        async def next(self, *, timeout=None):  # noqa: ANN001
+            if not events:
+                raise TimeoutError  # script exhausted: signal a timed-out read
+            return events.pop(0)  # consume the first remaining envelope
+
+        async def aclose(self) -> None:
+            return None
+
+    class StaticBus:  # bus double: publish is a no-op, subscribe yields a StaticStream
+        async def publish(self, envelope):  # noqa: ANN001
+            return None
+
+        @asynccontextmanager
+        async def subscribe(self, *, job_id: int):  # noqa: ARG002
+            yield StaticStream()
+
+    app = FastAPI()
+    app.include_router(router, prefix="/api/v1")
+    app.add_exception_handler(ApiError, api_error_handler)
+    app.dependency_overrides[get_current_user] = _user
+    app.dependency_overrides[get_db] = lambda: RunningJobDb()  # job status is "running"
+    app.dependency_overrides[get_agent_event_bus] = lambda: StaticBus()
+    client = TestClient(app)
+
+    response = client.get("/api/v1/agent/jobs/12/events")
+
+    assert response.status_code == 200
+    assert "event: agent.progress" in response.text  # both scripted bus events appear in the stream
+    assert "event: job.succeeded" in response.text
diff --git a/app/tests/test_agent_skill_service.py b/app/tests/test_agent_skill_service.py
index 79d8ffe..bc4d13f 100644
--- a/app/tests/test_agent_skill_service.py
+++ b/app/tests/test_agent_skill_service.py
@@ -76,6 +76,29 @@ async def test_update_custom_skill_requires_owner_private():
     session.commit.assert_not_awaited()
 
 
+@pytest.mark.asyncio  # create_custom_skill must reject a whitelist entry reported as unknown.
+async def test_create_custom_skill_rejects_unknown_tool():
+    session = DummySession()
+    session.scalar.return_value = None
+
+    repo = AgentSkillRepository(session)
+    service = SkillService(db=session, skills=repo)
+
+    with pytest.raises(ApiError) as exc:
+        await service.create_custom_skill(
+            user_id=7,
+            payload=CreateAgentSkillRequest(
+                name="Unsafe",
+                description="bad tool",
+                tool_whitelist=["drive.listFolder", "files.list"],  # only "files.list" is expected back as unknown
+            ),
+        )
+
+    assert exc.value.status_code == 422
+    assert exc.value.data == {"unknownTools": ["files.list"]}
+    session.commit.assert_not_awaited()  # nothing may be committed when the request is rejected
+
+
 @pytest.mark.asyncio
 async def test_delete_custom_skill_requires_owner_private():
     session = DummySession()
@@ -91,6 +114,33 @@ async def test_delete_custom_skill_requires_owner_private():
     session.commit.assert_not_awaited()
 
 
+@pytest.mark.asyncio  # import_global_skills must reject an item whose whitelist names an unknown tool.
+async def test_import_rejects_unknown_tool():
+    session = DummySession()
+    session.scalars.return_value = []
+
+    repo = AgentSkillRepository(session)
+    service = SkillService(db=session, skills=repo)
+
+    payload = ImportAgentSkillsRequest(
+        items=[
+            ImportAgentSkillItem(
+                skill_key="builtin:bad",
+                name="bad",
+                description="bad",
+                tool_whitelist=["drive.missing"],  # expected back verbatim in unknownTools
+            )
+        ],
+    )
+
+    with pytest.raises(ApiError) as exc:
+        await service.import_global_skills(payload=payload)
+
+    assert exc.value.status_code == 422
+    assert exc.value.data == {"unknownTools": ["drive.missing"]}
+    session.commit.assert_not_awaited()  # nothing may be committed when the import is rejected
+
+
 @pytest.mark.asyncio
 async def test_import_insert_only_conflict_raises_409():
     session = DummySession()
diff --git a/app/tests/test_agent_tools.py b/app/tests/test_agent_tools.py
new file mode 100644
index 0000000..36287ec
--- /dev/null
+++ b/app/tests/test_agent_tools.py
@@ -0,0 +1,240 @@
+from __future__ import annotations
+
+from types import SimpleNamespace
+from unittest.mock import AsyncMock
+
+import pytest
+
+from fileflash.agents.harness.router import ToolCall, ToolRouter
+from fileflash.agents.harness.tool_registry import REGISTRY, ToolRegistry, ToolSpec
+from fileflash.models.enums import FileStatus
+
+
+async def _noop_handler(_ctx, _args):  # noqa: ANN001
+    return {"ok": True}  # constant payload; both arguments are ignored
+
+
+def test_tool_registry_registers_and_maps_provider_names():  # Register one spec, then check name lookups.
+    registry = ToolRegistry()  # fresh registry, independent of the module-level REGISTRY
+    registry.register(
+        ToolSpec(
+            name="drive.testTool",
+            description="test",
+            input_schema={"type": "object"},
+            side_effect="read",
+            risk_level="low",
+            requires_confirmation=False,
+            handler=_noop_handler,
+        )
+    )
+
+    assert registry.all_names() == ("drive.testTool",)  # names come back as a tuple
+    assert registry.get("drive.testTool").anthropic_name == "drive_test_tool"  # provider-facing snake_case name
+    assert registry.get_by_provider_name("drive_test_tool").name == "drive.testTool"  # reverse lookup
+    assert registry.anthropic_tools_for(["drive.testTool"])[0]["internalName"] == "drive.testTool"
+
+
+def test_tool_registry_rejects_duplicate_names():  # Registering the same spec twice must fail.
+    registry = ToolRegistry()
+    spec = ToolSpec(
+        name="drive.testTool",
+        description="test",
+        input_schema={"type": "object"},
+        side_effect="read",
+        risk_level="low",
+        requires_confirmation=False,
+        handler=_noop_handler,
+    )
+    registry.register(spec)  # first registration is accepted
+
+    with pytest.raises(ValueError):
+        registry.register(spec)  # same name again must raise
+
+
+def test_builtin_registry_contains_new_query_tools():  # Checks the shared module-level REGISTRY.
+    names = set(REGISTRY.all_names())
+
+    assert {  # every listed tool name must be registered
+        "drive.searchFiles",
+        "drive.getFileInfo",
+        "drive.listRecent",
+        "drive.statsByCategory",
+        "drive.findDuplicates",
+    }.issubset(names)
+    assert REGISTRY.get("drive.deleteFile").risk_level == "high"  # delete is classified high risk
+
+
+class DummyDb:  # AsyncMock-backed stand-in passed to ToolRouter as db; tests override attributes as needed.
+    def __init__(self) -> None:
+        self.scalar = AsyncMock(return_value=1)  # default: every scalar() call returns 1
+        self.scalars = AsyncMock(return_value=[])  # default: every scalars() call returns no rows
+        self.execute = AsyncMock()
+        self.get = AsyncMock()
+
+
+@pytest.mark.asyncio  # Dispatch drive.searchFiles through ToolRouter against scripted DB results.
+async def test_tool_router_dispatches_new_search_files_tool():
+    db = DummyDb()
+    db.scalar = AsyncMock(
+        side_effect=[  # successive scalar() calls return these values in order
+            1,
+            SimpleNamespace(folder_name="My Files", parent_folder_id=None),
+        ]
+    )
+    db.scalars = AsyncMock(
+        side_effect=[  # successive scalars() calls; presumably folder ids, then file rows (confirm in the tool)
+            [1],
+            [
+                SimpleNamespace(
+                    file_id=10,
+                    file_name="movie.mp4",
+                    file_size=100,
+                    mime_type="video/mp4",
+                    file_ext="mp4",
+                    folder_id=1,
+                    storage_object_id=20,
+                    status=FileStatus.ACTIVE,
+                    is_latest=True,
+                    created_at=None,
+                    updated_at=None,
+                )
+            ],
+        ]
+    )
+    router = ToolRouter(db=db, user_id=7)  # type: ignore[arg-type]
+
+    result = await router.dispatch(
+        ToolCall(
+            tool_name="drive.searchFiles",
+            arguments={"folderId": "root", "query": "movie", "category": "video"},
+        )
+    )
+
+    assert result["totalItems"] == 1
+    assert result["items"][0]["name"] == "movie.mp4"  # file_name is exposed as "name"
+
+
+@pytest.mark.asyncio  # Dispatch drive.statsByCategory over one video row and one text row.
+async def test_tool_router_dispatches_stats_by_category_tool():
+    db = DummyDb()
+    db.scalars = AsyncMock(
+        side_effect=[  # successive scalars() calls; presumably folder ids, then file rows (confirm in the tool)
+            [1],
+            [
+                SimpleNamespace(
+                    file_id=10,
+                    file_name="movie.mp4",
+                    file_size=100,
+                    mime_type="video/mp4",
+                    file_ext="mp4",
+                    folder_id=1,
+                    storage_object_id=20,
+                    created_at=None,
+                    updated_at=None,
+                ),
+                SimpleNamespace(
+                    file_id=11,
+                    file_name="notes.txt",
+                    file_size=10,
+                    mime_type="text/plain",
+                    file_ext="txt",
+                    folder_id=1,
+                    storage_object_id=21,
+                    created_at=None,
+                    updated_at=None,
+                ),
+            ],
+        ]
+    )
+    router = ToolRouter(db=db, user_id=7)  # type: ignore[arg-type]
+
+    result = await router.dispatch(
+        ToolCall(tool_name="drive.statsByCategory", arguments={"folderId": "root"})
+    )
+
+    assert result["video"] == 1  # movie.mp4
+    assert result["document"] == 1  # notes.txt
+    assert result["totalSize"] == 110  # 100 + 10 from the two file_size values
+
+
+@pytest.mark.asyncio  # category "anime" must be reported back as "video" and count only the video row.
+async def test_tool_router_count_files_accepts_anime_alias_and_returns_item_names():
+    db = DummyDb()
+    db.scalar = AsyncMock(return_value=1)
+    db.scalars = AsyncMock(
+        side_effect=[  # successive scalars() calls; presumably folder ids, then file rows (confirm in the tool)
+            [1],
+            [
+                SimpleNamespace(
+                    file_id=10,
+                    file_name="银河动漫番剧.mp4",
+                    file_size=100,
+                    mime_type="video/mp4",
+                    file_ext="mp4",
+                    folder_id=1,
+                    storage_object_id=20,
+                    created_at=None,
+                    updated_at=None,
+                ),
+                SimpleNamespace(
+                    file_id=11,
+                    file_name="notes.txt",
+                    file_size=10,
+                    mime_type="text/plain",
+                    file_ext="txt",
+                    folder_id=1,
+                    storage_object_id=21,
+                    created_at=None,
+                    updated_at=None,
+                ),
+            ],
+        ]
+    )
+    router = ToolRouter(db=db, user_id=7)  # type: ignore[arg-type]
+
+    result = await router.dispatch(
+        ToolCall(
+            tool_name="drive.countFiles",
+            arguments={"folderId": "root", "recursive": True, "category": "anime"},
+        )
+    )
+
+    assert result["category"] == "video"  # the alias is normalized in the output
+    assert result["totalItems"] == 1  # notes.txt is not counted
+    assert result["itemNames"] == ["银河动漫番剧.mp4"]
+    assert result["itemNamesTruncated"] is False
+
+
+@pytest.mark.asyncio  # With 13 matching rows, itemNames must be cut to 12 and flagged as truncated.
+async def test_tool_router_count_files_truncates_item_names_at_limit():
+    db = DummyDb()
+    db.scalar = AsyncMock(return_value=1)
+    rows = [
+        SimpleNamespace(
+            file_id=100 + index,
+            file_name=f"video-{index:02d}.mp4",
+            file_size=100,
+            mime_type="video/mp4",
+            file_ext="mp4",
+            folder_id=1,
+            storage_object_id=200 + index,
+            created_at=None,
+            updated_at=None,
+        )
+        for index in range(13)  # one more row than the 12 names expected back
+    ]
+    db.scalars = AsyncMock(side_effect=[[1], rows])  # first call returns [1], second returns the file rows
+    router = ToolRouter(db=db, user_id=7)  # type: ignore[arg-type]
+
+    result = await router.dispatch(
+        ToolCall(
+            tool_name="drive.countFiles",
+            arguments={"folderId": "root", "recursive": True, "category": "video"},
+        )
+    )
+
+    assert result["totalItems"] == 13  # the count itself is not truncated
+    assert len(result["itemNames"]) == 12
+    assert result["itemNames"][0] == "video-00.mp4"
+    assert result["itemNames"][-1] == "video-11.mp4"  # the first 12 names, in row order
+    assert result["itemNamesTruncated"] is True
diff --git a/app/tests/test_agent_worker.py b/app/tests/test_agent_worker.py
index 65b15b0..1275bfe 100644
--- a/app/tests/test_agent_worker.py
+++ b/app/tests/test_agent_worker.py
@@ -6,6 +6,7 @@
 
 import pytest
 
+from fileflash.agents.harness.event_bus import AgentEventEnvelope
 from fileflash.agents.worker import AgentWorkerConsumer
 from fileflash.models import BackgroundJob
 
@@ -32,6 +33,19 @@ async def scalar(self, _query):  # noqa: ANN001
         return self._job
 
 
+class CaptureBus:  # Event-bus double that records every published envelope.
+    def __init__(self) -> None:
+        self.events: list[AgentEventEnvelope] = []  # envelopes in publish order
+
+    async def publish(self, envelope: AgentEventEnvelope) -> None:
+        self.events.append(envelope)  # record only
+
+
+class FailingBus:  # Event-bus double whose publish() always fails.
+    async def publish(self, envelope: AgentEventEnvelope) -> None:  # noqa: ARG002
+        raise RuntimeError("publish unavailable")  # unconditional failure on every publish
+
+
 def _job(*, status: str, cancel_requested_at: datetime | None) -> BackgroundJob:
     now = datetime.now(UTC)
     return BackgroundJob(
@@ -82,3 +96,45 @@ async def test_mark_failed_does_not_override_job_with_cancel_request(monkeypatch
     assert job.status == "running"
     assert job.cancel_requested_at == canceled_at
     assert job.error_message is None
+
+
+@pytest.mark.asyncio  # _mark_succeeded must publish exactly one job.succeeded event with a serialized result.
+async def test_mark_succeeded_publishes_terminal_event(monkeypatch: pytest.MonkeyPatch):
+    job = _job(status="running", cancel_requested_at=None)
+    session = DummySession(job)
+    bus = CaptureBus()  # records published envelopes for the assertions below
+    consumer = AgentWorkerConsumer(
+        queue=SimpleNamespace(),
+        session_factory=lambda: _AsyncContextManager(session),  # type: ignore[arg-type]
+        event_bus=bus,
+    )
+    monkeypatch.setattr("fileflash.agents.worker.apply_local_lock_timeout", AsyncMock(return_value=None))
+
+    finished_at = datetime.now(UTC).replace(microsecond=0)  # microseconds zeroed
+    await consumer._mark_succeeded(
+        job_id=65,
+        result={"summary": "ok", "finishedAt": finished_at},  # a datetime goes in; isoformat() text is expected out
+        phase="completed",
+    )
+
+    assert [event.event_type for event in bus.events] == ["job.succeeded"]  # one event, no others
+    assert bus.events[0].payload["status"] == "succeeded"
+    assert bus.events[0].payload["data"]["result"]["finishedAt"] == finished_at.isoformat()
+    assert job.result["finishedAt"] == finished_at.isoformat()  # the stored result is serialized the same way
+
+
+@pytest.mark.asyncio  # A failing event bus must not stop the job from being marked succeeded.
+async def test_mark_succeeded_ignores_publish_failures(monkeypatch: pytest.MonkeyPatch):
+    job = _job(status="running", cancel_requested_at=None)
+    session = DummySession(job)
+    consumer = AgentWorkerConsumer(
+        queue=SimpleNamespace(),
+        session_factory=lambda: _AsyncContextManager(session),  # type: ignore[arg-type]
+        event_bus=FailingBus(),
+    )
+    monkeypatch.setattr("fileflash.agents.worker.apply_local_lock_timeout", AsyncMock(return_value=None))
+
+    await consumer._mark_succeeded(job_id=65, result={"summary": "ok"}, phase="completed")  # must not raise
+
+    assert job.status == "succeeded"  # state change happened despite the publish error
+    assert job.result["summary"] == "ok"
diff --git a/app/tests/test_file_download_recycle_service.py b/app/tests/test_file_download_recycle_service.py
index 3d1caba..e0b6031 100644
--- a/app/tests/test_file_download_recycle_service.py
+++ b/app/tests/test_file_download_recycle_service.py
@@ -1,15 +1,29 @@
 from __future__ import annotations
 
+import tempfile
 from datetime import UTC, datetime
+from types import SimpleNamespace
 from unittest.mock import AsyncMock
 
 import pytest
-
-from fileflash.core.errors import ApiError
-from fileflash.models.enums import FileStatus, FolderStatus, FolderType, UploadStatus
+from fastapi import FastAPI
+from fastapi.testclient import TestClient
+
+from fileflash.core.deps import get_current_user, get_download_rate_limit_service, get_file_service
+from fileflash.core.errors import ApiError, api_error_handler
+from fileflash.models.enums import (
+    FileStatus,
+    FolderStatus,
+    FolderType,
+    UploadStatus,
+    UserRole,
+    UserStatus,
+)
+from fileflash.models.tables_identity import User
 from fileflash.models.tables_storage import File, FileMediaMetadata, Folder, StorageObject
-from fileflash.schemas.file import BatchFilesRequest
-from fileflash.services.file import FileService
+from fileflash.routers.files import router as files_router
+from fileflash.schemas.file import BatchDownloadRequest, BatchFilesRequest
+from fileflash.services.file import BatchDownloadPlan, DownloadStreamResult, FileService
 
 
 class DummyStorage:
@@ -41,6 +55,14 @@ def __init__(self) -> None:
         self.delete = AsyncMock()
 
 
+class ResultRows:
+    def __init__(self, rows) -> None:  # noqa: ANN001
+        self._rows = rows
+
+    def all(self):  # noqa: ANN201
+        return self._rows
+
+
 def make_file_row(*, file_id: int = 1, file_name: str = "demo.txt", folder_id: int = 10) -> File:
     return File(
         file_id=file_id,
@@ -73,6 +95,22 @@ def make_folder_row(*, folder_id: int = 10, folder_name: str = "Docs") -> Folder
     )
 
 
+def make_user(*, role: UserRole = UserRole.USER) -> User:
+    return User(
+        user_id=1,
+        username="alice",
+        email="alice@example.com",
+        password_hash="x",
+        role=role,
+        status=UserStatus.ACTIVE,
+        email_verified=True,
+        storage_limit=1024,
+        storage_used=0,
+        created_at=datetime.now(UTC),
+        updated_at=datetime.now(UTC),
+    )
+
+
 @pytest.mark.asyncio
 async def test_get_download_stream_supports_single_range(monkeypatch: pytest.MonkeyPatch):
     session = DummySession()
@@ -375,6 +413,145 @@ async def test_get_preview_stream_falls_back_to_source_when_transcoded_missing(m
     assert result.headers["Content-Length"] == "512"
 
 
+@pytest.mark.asyncio
+async def test_batch_download_plan_estimates_source_file_size() -> None:
+    session = DummySession()
+    storage = DummyStorage()
+    service = FileService(db=session, storage=storage)
+    file_row = make_file_row(file_id=7, file_name="archive.bin")
+    file_row.storage_object_id = 99
+    storage_object = StorageObject(
+        object_id=99,
+        bucket_name="fileflash",
+        object_key="objects/u1/archive",
+        object_size=512,
+        upload_status=UploadStatus.ACTIVE,
+        content_type="application/octet-stream",
+    )
+    session.scalars = AsyncMock(return_value=[file_row])
+    session.execute = AsyncMock(return_value=ResultRows([(file_row, storage_object)]))
+
+    plan = await service.create_batch_download_plan(
+        user_id=1,
+        payload=BatchDownloadRequest(fileIds=["7"]),
+    )
+
+    assert plan.estimated_bytes == 512
+    assert plan.files[0][2] == "archive.bin"
+
+
+class StubDownloadLimiter:
+    def __init__(self, *, deny: bool = False) -> None:
+        self.deny = deny
+        self.calls: list[tuple[str, int]] = []
+
+    async def enforce_user(self, *, user: User, bytes_count: int) -> None:
+        self.calls.append((f"user:{user.user_id}", bytes_count))
+        if self.deny and user.role != UserRole.ADMIN:
+            raise ApiError(status_code=429, code=429, message="Download rate limit exceeded")
+
+    async def enforce_user_id(self, *, user_id: int, bytes_count: int) -> None:
+        self.calls.append((f"user:{user_id}", bytes_count))
+        if self.deny:
+            raise ApiError(status_code=429, code=429, message="Download rate limit exceeded")
+
+
+class StubFileRouteService:
+    async def get_download_stream(
+        self,
+        *,
+        user_id: int,  # noqa: ARG002
+        file_id: str,  # noqa: ARG002
+        range_header: str | None,
+    ) -> DownloadStreamResult:
+        async def _stream():
+            yield b"0123456789"
+
+        headers = {"Content-Length": "4" if range_header else "10", "Accept-Ranges": "bytes"}
+        if range_header:
+            headers["Content-Range"] = "bytes 0-3/10"
+        return DownloadStreamResult(
+            stream=_stream(),
+            filename="demo.txt",
+            content_type="text/plain",
+            status_code=206 if range_header else 200,
+            headers=headers,
+        )
+
+    async def get_preview_stream(self, **kwargs) -> DownloadStreamResult:  # noqa: ANN003
+        return await self.get_download_stream(**kwargs)
+
+    async def create_batch_download_plan(
+        self,
+        *,
+        user_id: int,  # noqa: ARG002
+        payload: BatchDownloadRequest,  # noqa: ARG002
+    ) -> BatchDownloadPlan:
+        return SimpleNamespace(estimated_bytes=10, files=[object()])  # type: ignore[return-value]
+
+    async def create_batch_download_archive_from_plan(self, *, plan: BatchDownloadPlan):  # noqa: ANN201, ARG002
+        tmp = tempfile.NamedTemporaryFile(prefix="fileflash-test-", suffix=".zip", delete=False)
+        tmp.write(b"zip")
+        tmp.close()
+        return tmp.name, "test.zip"
+
+
+def _files_client(*, role: UserRole, limiter: StubDownloadLimiter) -> TestClient:
+    app = FastAPI()
+    app.add_exception_handler(ApiError, api_error_handler)
+    app.include_router(files_router, prefix="/api/v1")
+    app.dependency_overrides[get_current_user] = lambda: make_user(role=role)
+    app.dependency_overrides[get_file_service] = lambda: StubFileRouteService()
+    app.dependency_overrides[get_download_rate_limit_service] = lambda: limiter
+    return TestClient(app)
+
+
+def test_download_route_returns_429_when_limiter_rejects_user() -> None:
+    limiter = StubDownloadLimiter(deny=True)
+    with _files_client(role=UserRole.USER, limiter=limiter) as client:
+        response = client.get("/api/v1/files/1/download")
+
+    assert response.status_code == 429
+    assert limiter.calls == [("user:1", 10)]
+
+
+def test_download_route_preserves_range_response_when_allowed() -> None:
+    limiter = StubDownloadLimiter()
+    with _files_client(role=UserRole.USER, limiter=limiter) as client:
+        response = client.get("/api/v1/files/1/download", headers={"Range": "bytes=0-3"})
+
+    assert response.status_code == 206
+    assert response.headers["content-range"] == "bytes 0-3/10"
+    assert limiter.calls == [("user:1", 4)]
+
+
+def test_admin_download_route_is_not_rejected_by_user_limiter() -> None:
+    limiter = StubDownloadLimiter(deny=True)
+    with _files_client(role=UserRole.ADMIN, limiter=limiter) as client:
+        response = client.get("/api/v1/files/1/download")
+
+    assert response.status_code == 200
+    assert limiter.calls == [("user:1", 10)]
+
+
+def test_batch_download_route_returns_429_before_archive_when_limited() -> None:
+    limiter = StubDownloadLimiter(deny=True)
+    with _files_client(role=UserRole.USER, limiter=limiter) as client:
+        response = client.post("/api/v1/files/batch-download", json={"fileIds": ["1"]})
+
+    assert response.status_code == 429
+    assert limiter.calls == [("user:1", 10)]
+
+
+def test_admin_batch_download_route_is_not_rejected_by_user_limiter() -> None:
+    limiter = StubDownloadLimiter(deny=True)
+    with _files_client(role=UserRole.ADMIN, limiter=limiter) as client:
+        response = client.post("/api/v1/files/batch-download", json={"fileIds": ["1"]})
+
+    assert response.status_code == 200
+    assert response.content == b"zip"
+
+
 @pytest.mark.asyncio
 async def test_delete_file_marks_record_deleted(monkeypatch: pytest.MonkeyPatch):
     session = DummySession()
diff --git a/app/tests/test_rate_limiter.py b/app/tests/test_rate_limiter.py
new file mode 100644
index 0000000..386c160
--- /dev/null
+++ b/app/tests/test_rate_limiter.py
@@ -0,0 +1,92 @@
+from __future__ import annotations
+
+from unittest.mock import AsyncMock
+
+import pytest
+from redis.exceptions import RedisError
+
+from fileflash.core.settings import Settings
+from fileflash.models.enums import UserRole, UserStatus
+from fileflash.models.tables_identity import User
+from fileflash.services.download_rate_limit import DownloadRateLimitService
+from fileflash.services.rate_limiter import RedisRateLimiter
+
+
+class FakeRedis:
+    def __init__(self, *, fail: bool = False) -> None:
+        self.fail = fail
+        self.values: dict[str, int] = {}
+        self.expired: list[tuple[str, int]] = []
+
+    async def incrby(self, key: str, amount: int) -> int:
+        if self.fail:
+            raise RedisError("down")
+        self.values[key] = self.values.get(key, 0) + amount
+        return self.values[key]
+
+    async def expire(self, key: str, window_seconds: int) -> None:
+        self.expired.append((key, window_seconds))
+
+
+@pytest.mark.asyncio
+async def test_allow_weighted_uses_incrby_and_sets_ttl() -> None:
+    limiter = RedisRateLimiter("redis://example")
+    fake = FakeRedis()
+    limiter._redis = fake  # type: ignore[assignment]
+
+    allowed = await limiter.allow_weighted("k", limit=10, window_seconds=60, weight=4)
+
+    assert allowed is True
+    assert fake.values["k"] == 4
+    assert fake.expired == [("k", 60)]
+
+
+@pytest.mark.asyncio
+async def test_allow_weighted_rejects_over_limit() -> None:
+    limiter = RedisRateLimiter("redis://example")
+    fake = FakeRedis()
+    limiter._redis = fake  # type: ignore[assignment]
+
+    assert await limiter.allow_weighted("k", limit=5, window_seconds=60, weight=4) is True
+    assert await limiter.allow_weighted("k", limit=5, window_seconds=60, weight=2) is False
+
+
+@pytest.mark.asyncio
+async def test_allow_weighted_degrades_open_when_redis_fails() -> None:
+    limiter = RedisRateLimiter("redis://example")
+    limiter._redis = FakeRedis(fail=True)  # type: ignore[assignment]
+
+    assert await limiter.allow_weighted("k", limit=1, window_seconds=60, weight=10) is True
+
+
+class FakeRateLimiter:
+    def __init__(self) -> None:
+        self.allow = AsyncMock(return_value=False)
+        self.allow_weighted = AsyncMock(return_value=False)
+
+
+@pytest.mark.asyncio
+async def test_download_rate_limiter_skips_admin_user_id() -> None:
+    admin = User(
+        user_id=1,
+        username="admin",
+        email="admin@example.com",
+        password_hash="x",
+        role=UserRole.ADMIN,
+        status=UserStatus.ACTIVE,
+        email_verified=True,
+        storage_limit=1024,
+        storage_used=0,
+    )
+    db = type("Db", (), {"get": AsyncMock(return_value=admin)})()
+    rate_limiter = FakeRateLimiter()
+    service = DownloadRateLimitService(
+        db=db,  # type: ignore[arg-type]
+        settings=Settings(DATABASE_URL="sqlite+aiosqlite:///:memory:"),
+        rate_limiter=rate_limiter,  # type: ignore[arg-type]
+    )
+
+    await service.enforce_user_id(user_id=1, bytes_count=100)
+
+    rate_limiter.allow.assert_not_awaited()
+    rate_limiter.allow_weighted.assert_not_awaited()
diff --git a/app/tests/test_settings.py b/app/tests/test_settings.py
index 738f3ff..52356ea 100644
--- a/app/tests/test_settings.py
+++ b/app/tests/test_settings.py
@@ -32,9 +32,18 @@ def test_agent_related_settings_defaults():
     assert settings.agent_queue_stream == "fileflash:agents"
     assert settings.agent_job_timeout_sec == 600
     assert settings.agent_tool_timeout_sec == 30
+    assert settings.agent_llm_plan_max_tokens == 8192
     assert settings.agent_mcp_endpoints == ()
 
 
+def test_auth_risk_control_defaults():
+    settings = make_settings()
+    assert settings.register_rate_limit == 12
+    assert settings.login_rate_limit == 30
+    assert settings.max_failed_login_attempts == 8
+    assert settings.account_lock_minutes == 5
+
+
 def test_app_env_detection():
     dev = make_settings(APP_ENV="development")
     assert dev.is_development_env is True
diff --git a/app/tests/test_share_routes.py b/app/tests/test_share_routes.py
index 48cb008..e6d5b6f 100644
--- a/app/tests/test_share_routes.py
+++ b/app/tests/test_share_routes.py
@@ -5,7 +5,13 @@
 from fastapi import FastAPI
 from fastapi.testclient import TestClient
 
-from fileflash.core.deps import get_client_ip, get_share_service, get_user_agent
+from fileflash.core.deps import (
+    get_client_ip,
+    get_download_rate_limit_service,
+    get_share_service,
+    get_user_agent,
+)
+from fileflash.core.errors import ApiError, api_error_handler
 from fileflash.routers.shares import router as shares_router
 
 
@@ -19,6 +25,7 @@ async def get_shared_file_download_stream_response(
         range_header: str | None,  # noqa: ARG002
         ip_address: str,  # noqa: ARG002
         user_agent: str | None,  # noqa: ARG002
+        rate_limit_check=None,  # noqa: ANN001
     ) -> tuple[AsyncIterator[bytes], str, str, int, dict[str, str]]:
         async def _stream() -> AsyncIterator[bytes]:
             yield b"data"
@@ -32,15 +39,30 @@ async def _stream() -> AsyncIterator[bytes]:
             "Accept-Ranges": "bytes",
             "Content-Length": "4",
         }
+        if rate_limit_check is not None:
+            await rate_limit_check(4)
         return _stream(), "测试文档.pdf", "application/pdf", 200, headers
 
 
-def _build_client() -> TestClient:
+class StubDownloadLimiter:
+    def __init__(self, *, deny: bool = False) -> None:
+        self.deny = deny
+        self.calls: list[tuple[str, int]] = []
+
+    async def enforce_share_ip(self, *, client_ip: str, bytes_count: int) -> None:
+        self.calls.append((client_ip, bytes_count))
+        if self.deny:
+            raise ApiError(status_code=429, code=429, message="Download rate limit exceeded")
+
+
+def _build_client(limiter: StubDownloadLimiter | None = None) -> TestClient:
     app = FastAPI()
+    app.add_exception_handler(ApiError, api_error_handler)
     app.include_router(shares_router, prefix="/api/v1")
     app.dependency_overrides[get_share_service] = lambda: StubShareService()
     app.dependency_overrides[get_client_ip] = lambda: "127.0.0.1"
     app.dependency_overrides[get_user_agent] = lambda: "pytest"
+    app.dependency_overrides[get_download_rate_limit_service] = lambda: limiter or StubDownloadLimiter()
     return TestClient(app)
 
 
@@ -71,3 +93,27 @@ def test_shared_preview_handles_unicode_filename_header() -> None:
     assert 'filename*=UTF-8\'\'' in header
     header.encode("latin-1")
     assert response.content == b"data"
+
+
+def test_shared_download_returns_429_when_ip_limited() -> None:
+    limiter = StubDownloadLimiter(deny=True)
+    with _build_client(limiter) as client:
+        response = client.get(
+            "/api/v1/shares/ABCD/download",
+            headers={"Authorization": "Bearer test-share-token"},
+        )
+
+    assert response.status_code == 429
+    assert limiter.calls == [("127.0.0.1", 4)]
+
+
+def test_shared_preview_returns_429_when_ip_limited() -> None:
+    limiter = StubDownloadLimiter(deny=True)
+    with _build_client(limiter) as client:
+        response = client.get(
+            "/api/v1/shares/ABCD/preview",
+            headers={"Authorization": "Bearer test-share-token"},
+        )
+
+    assert response.status_code == 429
+    assert limiter.calls == [("127.0.0.1", 4)]
diff --git a/docker/flyway/migrations/V14__agent_inbox.sql b/docker/flyway/migrations/V14__agent_inbox.sql
new file mode 100644
index 0000000..16ab9e0
--- /dev/null
+++ b/docker/flyway/migrations/V14__agent_inbox.sql
@@ -0,0 +1,49 @@
+-- =========================
+-- Domain: agent inbox
+-- =========================
+
+DO $$
+BEGIN
+    IF NOT EXISTS (SELECT 1 FROM pg_type WHERE typname = 'agent_inbox_role_enum') THEN
+        CREATE TYPE agent_inbox_role_enum AS ENUM ('agent', 'user');
+    END IF;
+    IF NOT EXISTS (SELECT 1 FROM pg_type WHERE typname = 'agent_inbox_kind_enum') THEN
+        CREATE TYPE agent_inbox_kind_enum AS ENUM (
+            'ask',
+            'reply',
+            'control.pause',
+            'control.resume',
+            'control.approve',
+            'control.deny',
+            'control.skip',
+            'control.cancel'
+        );
+    END IF;
+    IF NOT EXISTS (SELECT 1 FROM pg_type WHERE typname = 'agent_inbox_status_enum') THEN
+        CREATE TYPE agent_inbox_status_enum AS ENUM ('waiting', 'answered', 'timed_out', 'dropped');
+    END IF;
+END
+$$;
+
+CREATE TABLE IF NOT EXISTS agent_inbox_message (
+    inbox_message_id BIGINT GENERATED BY DEFAULT AS IDENTITY PRIMARY KEY,
+    job_id BIGINT NOT NULL,
+    role agent_inbox_role_enum NOT NULL,
+    kind agent_inbox_kind_enum NOT NULL,
+    payload_json JSONB NOT NULL DEFAULT '{}'::jsonb,
+    reply_to_id BIGINT NULL,
+    status agent_inbox_status_enum NULL,
+    created_at TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP,
+    answered_at TIMESTAMP NULL,
+    CONSTRAINT fk_agent_inbox_message_job
+        FOREIGN KEY (job_id) REFERENCES background_job(job_id) ON DELETE CASCADE,
+    CONSTRAINT fk_agent_inbox_message_reply_to
+        FOREIGN KEY (reply_to_id) REFERENCES agent_inbox_message(inbox_message_id) ON DELETE SET NULL
+);
+
+CREATE INDEX IF NOT EXISTS idx_agent_inbox_message_job_created
+    ON agent_inbox_message (job_id, created_at);
+
+CREATE INDEX IF NOT EXISTS idx_agent_inbox_message_job_status
+    ON agent_inbox_message (job_id, status)
+    WHERE status IS NOT NULL;
diff --git a/docker/flyway/migrations/V15__agent_tool_registry_skills.sql b/docker/flyway/migrations/V15__agent_tool_registry_skills.sql
new file mode 100644
index 0000000..f1a9079
--- /dev/null
+++ b/docker/flyway/migrations/V15__agent_tool_registry_skills.sql
@@ -0,0 +1,19 @@
+UPDATE agent_skill
+SET tool_whitelist_json = '[
+    "drive.listFolder",
+    "drive.countFiles",
+    "drive.searchFiles",
+    "drive.getFileInfo",
+    "drive.listRecent",
+    "drive.statsByCategory",
+    "drive.findDuplicates",
+    "drive.createFolder",
+    "drive.moveFile",
+    "drive.moveFolder",
+    "drive.renameFile",
+    "drive.renameFolder",
+    "drive.deleteFile",
+    "drive.deleteFolder"
+]'::jsonb,
+updated_at = CURRENT_TIMESTAMP
+WHERE skill_key = 'builtin:organizeByType';
diff --git a/docs/superpowers/plans/2026-05-24-admin-console-backend.md b/docs/superpowers/plans/2026-05-24-admin-console-backend.md
index 5551456..ebdb421 100644
--- a/docs/superpowers/plans/2026-05-24-admin-console-backend.md
+++ b/docs/superpowers/plans/2026-05-24-admin-console-backend.md
@@ -89,6 +89,7 @@ app/src/fileflash/
 ## Task 0: 基础设施（admin 包 + 状态映射）
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/__init__.py`
 - Create: `app/src/fileflash/services/admin/__init__.py`
 - Create: `app/src/fileflash/services/admin/_status.py`
@@ -214,6 +215,7 @@ git commit -m "feat(admin): scaffold admin packages and user status mapping"
 ## Task 1: Admin Users — schemas + service
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/users.py`
 - Create: `app/src/fileflash/services/admin/users.py`
 - Test: `app/tests/test_admin_users_service.py`
@@ -602,6 +604,7 @@ git commit -m "feat(admin): users service with list and set_status (last-admin g
 ## Task 2: Admin Users — router + deps + 注册
 
 **Files:**
+
 - Create: `app/src/fileflash/routers/admin_users.py`
 - Modify: `app/src/fileflash/core/deps.py`
 - Modify: `app/src/fileflash/routers/__init__.py`
@@ -785,6 +788,7 @@ git commit -m "feat(admin): /admin/users list + /admin/users/{id}/status routes"
 ## Task 3: Admin Storage（summary / users / quota / usage-trend）
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/storage.py`
 - Create: `app/src/fileflash/services/admin/storage.py`
 - Create: `app/src/fileflash/routers/admin_storage.py`
@@ -1370,6 +1374,7 @@ git commit -m "feat(admin): /admin/storage summary, users, quota, usage-trend"
 ## Task 4: Admin Files（list + rescan）
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/files.py`
 - Create: `app/src/fileflash/services/admin/files.py`
 - Create: `app/src/fileflash/routers/admin_files.py`
@@ -1836,6 +1841,7 @@ git commit -m "feat(admin): /admin/files list + /admin/files/{id}/rescan with ev
 ## Task 5: Admin Moderation（violations list + resolve）
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/moderation.py`
 - Create: `app/src/fileflash/services/admin/moderation.py`
 - Create: `app/src/fileflash/routers/admin_moderation.py`
@@ -2201,6 +2207,7 @@ git commit -m "feat(admin): /admin/violations list + resolve via ModerationCase"
 ## Task 6: Admin Logs
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/logs.py`
 - Create: `app/src/fileflash/services/admin/logs.py`
 - Create: `app/src/fileflash/routers/admin_logs.py`
@@ -2421,6 +2428,7 @@ git commit -m "feat(admin): /admin/logs list with filters"
 ## Task 7: Admin Notifications（list / broadcast / read / archive）
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/notifications.py`
 - Create: `app/src/fileflash/services/admin/notifications.py`
 - Create: `app/src/fileflash/routers/admin_notifications.py`
@@ -2873,6 +2881,7 @@ git commit -m "feat(admin): /admin/notifications list, broadcast, archive"
 ## Task 8: Admin System（health + rate-limit）
 
 **Files:**
+
 - Create: `app/src/fileflash/schemas/admin/system.py`
 - Create: `app/src/fileflash/services/admin/system.py`
 - Create: `app/src/fileflash/routers/admin_system.py`
diff --git a/docs/superpowers/plans/2026-05-24-admin-console-frontend.md b/docs/superpowers/plans/2026-05-24-admin-console-frontend.md
index 99b597c..f236394 100644
--- a/docs/superpowers/plans/2026-05-24-admin-console-frontend.md
+++ b/docs/superpowers/plans/2026-05-24-admin-console-frontend.md
@@ -87,6 +87,7 @@ web/src/pages/dashboard/index.ts
 ## Task 0: api / types / mock 对齐 Plan A 契约
 
 **Files:**
+
 - Modify: `web/src/api/storage.ts`, `web/src/api/log.ts`, `web/src/api/notification.ts`
 - Modify: `web/src/types/log.d.ts`, `web/src/types/notification.d.ts`
 - Modify: `web/src/mock/handlers/log.ts`, `web/src/mock/handlers/notification.ts`, `web/src/mock/handlers/storage.ts`
@@ -275,6 +276,7 @@ git commit -m "feat(web): align api+mock with Plan A admin contracts"
 ## Task 1: ConsoleLayout + Sidebar + 路由
 
 **Files:**
+
 - Create: `web/src/pages/console/ConsoleLayout.vue`, `ConsoleSidebar.vue`, `index.ts`
 - Modify: `web/src/router/routes.ts`
 
@@ -472,6 +474,7 @@ git commit -m "feat(web): scaffold Console layout, sidebar, and 9 subpage routes
 ## Task 2: 共享组件（components/console/）
 
 **Files:**
+
 - Create: `web/src/components/console/KpiCard.vue`, `StatusBadge.vue`, `FilterBar.vue`, `AdminTable.vue`, `TrendChart.vue`, `BroadcastComposer.vue`, `QuotaEditor.vue`, `index.ts`
 
 - [ ] **Step 2.1: KpiCard.vue**
@@ -840,6 +843,7 @@ git commit -m "feat(web): add Console shared components (KpiCard, AdminTable, et
 ## Task 3: Overview 子页
 
 **Files:**
+
 - Replace placeholder: `web/src/pages/console/overview/OverviewPage.vue`
 
 - [ ] **Step 3.1: 实现 OverviewPage**
@@ -1825,6 +1829,7 @@ git commit -m "feat(web): Console Rules page (registration email domains)"
 ## Task 12: 主框架集成、删除旧 Dashboard、i18n
 
 **Files:**
+
 - Modify: `web/src/components/organisms/shell/UserMenu.vue`
 - Modify: `web/src/i18n/messages.ts`
 - Delete: `web/src/pages/dashboard/Dashboard.vue`, `web/src/pages/dashboard/index.ts`
@@ -1856,9 +1861,10 @@ Edit `web/src/i18n/messages.ts`：
   | 'console.nav.rules'
 ```
 
-2. 中英 messages 表中，把原 `'header.menu.dashboard': '仪表盘'` 改为 `'header.menu.console': '控制台'`（en-US 改为 `'Console'`）。追加：
+1. 中英 messages 表中，把原 `'header.menu.dashboard': '仪表盘'` 改为 `'header.menu.console': '控制台'`（en-US 改为 `'Console'`）。追加：
 
 中文表：
+
 ```
     'console.title': '控制台',
     'console.nav.overview': '概览',
@@ -1873,6 +1879,7 @@ Edit `web/src/i18n/messages.ts`：
 ```
 
 英文表：
+
 ```
     'console.title': 'Console',
     'console.nav.overview': 'Overview',
@@ -1924,6 +1931,7 @@ git commit -m "feat(web): wire Console into MainLayout, drop legacy Dashboard, a
 ```bash
 cd web && bun run check
 ```
+
 Expected: 0 errors。
 
 - [ ] **Step 13.2: 全量构建**
@@ -1931,6 +1939,7 @@ Expected: 0 errors。
 ```bash
 cd web && bun run build
 ```
+
 Expected: dist/ 生成、无错误。
 
 - [ ] **Step 13.3: dev server 手动巡检**
diff --git a/docs/superpowers/plans/2026-05-26-agent-A-interaction-backend.md b/docs/superpowers/plans/2026-05-26-agent-A-interaction-backend.md
new file mode 100644
index 0000000..ab86d63
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-26-agent-A-interaction-backend.md
@@ -0,0 +1,2284 @@
+# Agent 子项目 A（交互/反馈层）— 后端实现计划
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** 把 agent 后端从单向 SSE + DB 轮询升级为 Redis pub/sub 推送 + POST inbox 双向通道，支持 `agent.ask` / `agent.progress` / `agent.thinking` / `tool.partial` 等新事件，以及 pause/resume/skip/approve/cancel 等控制信号在 step 边界生效。
+
+**Architecture:** 新增三大单元：`AgentEventBus`（Redis pub/sub 封装）、`AgentInbox` 服务（含 `AgentInboxMessage` 表 + repository）、`AskProtocol` 协议；SSE 端点从轮询 DB 改为订阅 Redis channel；ExecuteRunner / PlanRunner 在 step 边界检查 inbox。前端最小接入留给前端 plan。
+
+**Tech Stack:** Python 3.12 + FastAPI + SQLAlchemy async + Redis pub/sub (`redis.asyncio`) + Flyway SQL 迁移 + pytest + 既有 stub 风格测试（不引入 fakeredis）。
+
+**Spec:** `docs/superpowers/specs/2026-05-26-agent-improvements-design.md` 子项目 A 部分
+
+---
+
+## File Structure
+
+**新建（src）**
+
+- `app/src/fileflash/agents/harness/event_bus.py` — `AgentEventBus`（publish + subscribe）+ 内存 stub 用于测试
+- `app/src/fileflash/agents/harness/inbox.py` — `AgentInbox` 服务（写表 + publish）
+- `app/src/fileflash/agents/harness/ask.py` — `AskProtocol` 协议（创建 ask 消息、阻塞等回答）
+- `app/src/fileflash/repositories/agent/inbox.py` — `AgentInboxMessageRepository`
+
+**新建（迁移）**
+
+- `docker/flyway/migrations/V14__agent_inbox.sql` — `AgentInboxMessage` 表 + enum 类型
+
+**修改**
+
+- `app/src/fileflash/models/enums.py` — 新增 `AgentInboxRole` / `AgentInboxKind` / `AgentInboxStatus`
+- `app/src/fileflash/models/tables_agent.py` — 新增 `AgentInboxMessage` ORM model
+- `app/src/fileflash/models/__init__.py` — 导出 `AgentInboxMessage`
+- `app/src/fileflash/repositories/__init__.py` — 导出 `AgentInboxMessageRepository`
+- `app/src/fileflash/schemas/agent.py` — 新事件类型字面量 + 上行 message 类型
+- `app/src/fileflash/routers/agent.py` — 新增 `POST /agent/jobs/{id}/messages`、改 SSE 实现、删除 `POST /agent/cancel/{job_id}`
+- `app/src/fileflash/agents/runtime/execute_runner.py` — step 边界检查 inbox（pause/resume/cancel/skip/approve）+ publish 工具事件
+- `app/src/fileflash/agents/runtime/plan_runner.py` — 接入 ask 协议
+- `app/src/fileflash/agents/worker.py` — 创建 EventBus 单例并下发到 runner
+- `app/src/fileflash/core/settings.py` — 增 `agent_inbox_ask_timeout_sec`（默认 1800）+ Redis pub/sub channel 配置项
+- `app/src/fileflash/core/deps.py` — 注入 `AgentEventBus` 依赖
+
+**测试**
+
+- `app/tests/test_agent_event_bus.py` — 新
+- `app/tests/test_agent_inbox.py` — 新
+- `app/tests/test_agent_ask_protocol.py` — 新
+- `app/tests/test_agent_routes.py` — 扩展
+- `app/tests/test_agent_plan_execute_runtime.py` — 扩展
+
+**前端**
+
+不在本 plan 范围。参见 `2026-05-26-agent-A-interaction-frontend.md`。本 plan 完成后，后端通过 curl/httpx 集成测试可以独立验证。
+
+---
+
+## Sequencing
+
+```
+Task 1 (settings) ──► Task 2 (enums) ──► Task 3 (SQL 迁移) ──► Task 4 (ORM model)
+                                                                       │
+                                              ┌────────────────────────┘
+                                              ▼
+                                  Task 5 (repository)
+                                              │
+       ┌──────────────────────────────────────┼─────────────────────────┐
+       ▼                                       ▼                         ▼
+Task 6 (schemas)                Task 7 (EventBus)               Task 8 (Inbox service)
+                                                                          │
+                                                                          ▼
+                                                                  Task 9 (Ask protocol)
+                                                                          │
+                                                ┌─────────────────────────┘
+                                                ▼
+                                  Task 10 (POST /messages 路由)
+                                                │
+                                                ▼
+                                  Task 11 (SSE 改 EventBus subscribe)
+                                                │
+                                                ▼
+                                  Task 12 (删 POST /cancel)
+                                                │
+                                                ▼
+                                  Task 13 (ExecuteRunner 接 inbox)
+                                                │
+                                                ▼
+                                  Task 14 (PlanRunner 接 ask)
+                                                │
+                                                ▼
+                                  Task 15 (worker 装配)
+                                                │
+                                                ▼
+                                  Task 16 (端到端集成测试)
+```
+
+---
+
+## Task 1: 配置项与依赖
+
+**Files:**
+
+- Modify: `app/src/fileflash/core/settings.py`
+
+- [ ] **Step 1: 在 `Settings` 类合适位置（紧跟 `redis_url` 之后）增加 4 个配置项**
+
+```python
+    agent_inbox_ask_timeout_sec: int = Field(
+        default=1800,
+        alias="AGENT_INBOX_ASK_TIMEOUT_SEC",
+    )
+    agent_event_channel_prefix: str = Field(
+        default="agent:job",
+        alias="AGENT_EVENT_CHANNEL_PREFIX",
+    )
+    agent_inbox_channel_prefix: str = Field(
+        default="agent:inbox",
+        alias="AGENT_INBOX_CHANNEL_PREFIX",
+    )
+    agent_event_bus_buffer_size: int = Field(
+        default=64,
+        alias="AGENT_EVENT_BUS_BUFFER_SIZE",
+    )
+```
+
+- [ ] **Step 2: 删除既有 `routers/agent.py` 顶部的 `AGENT_EVENT_POLL_INTERVAL_SEC` 常量（line 22）。删除前先用 Grep 确认没有其它文件引用此常量。**
+
+Run: `grep -rn "AGENT_EVENT_POLL_INTERVAL_SEC" app/src/ app/tests/`
+Expected: 仅 `routers/agent.py:22` 一处定义、`_event_stream` 内一处引用。
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add app/src/fileflash/core/settings.py
+git commit -m "feat(agent): add inbox + event bus settings"
+```
+
+---
+
+## Task 2: 新增 inbox 相关枚举
+
+**Files:**
+
+- Modify: `app/src/fileflash/models/enums.py`
+
+- [ ] **Step 1: 在 `AgentMcpVisibility` 之后追加三个枚举**
+
+```python
+class AgentInboxRole(BaseStrEnum):
+    AGENT = "agent"
+    USER = "user"
+
+
+class AgentInboxKind(BaseStrEnum):
+    ASK = "ask"
+    REPLY = "reply"
+    CONTROL_PAUSE = "control.pause"
+    CONTROL_RESUME = "control.resume"
+    CONTROL_APPROVE = "control.approve"
+    CONTROL_DENY = "control.deny"
+    CONTROL_SKIP = "control.skip"
+    CONTROL_CANCEL = "control.cancel"
+
+
+class AgentInboxStatus(BaseStrEnum):
+    WAITING = "waiting"
+    ANSWERED = "answered"
+    TIMED_OUT = "timed_out"
+    DROPPED = "dropped"
+```
+
+- [ ] **Step 2: 把上面三个名字加到 `__all__` 末尾**
+
+```python
+__all__ = [
+    # ... existing entries ...
+    "AgentInboxRole",
+    "AgentInboxKind",
+    "AgentInboxStatus",
+]
+```
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add app/src/fileflash/models/enums.py
+git commit -m "feat(agent): add inbox role/kind/status enums"
+```
+
+---
+
+## Task 3: Flyway 迁移 V14（新表 + pg enums）
+
+**Files:**
+
+- Create: `docker/flyway/migrations/V14__agent_inbox.sql`
+
+- [ ] **Step 1: 写完整 SQL 迁移**
+
+```sql
+-- =========================
+-- Domain: agent inbox
+-- =========================
+
+DO $$
+BEGIN
+    IF NOT EXISTS (SELECT 1 FROM pg_type WHERE typname = 'agent_inbox_role_enum') THEN
+        CREATE TYPE agent_inbox_role_enum AS ENUM ('agent', 'user');
+    END IF;
+    IF NOT EXISTS (SELECT 1 FROM pg_type WHERE typname = 'agent_inbox_kind_enum') THEN
+        CREATE TYPE agent_inbox_kind_enum AS ENUM (
+            'ask',
+            'reply',
+            'control.pause',
+            'control.resume',
+            'control.approve',
+            'control.deny',
+            'control.skip',
+            'control.cancel'
+        );
+    END IF;
+    IF NOT EXISTS (SELECT 1 FROM pg_type WHERE typname = 'agent_inbox_status_enum') THEN
+        CREATE TYPE agent_inbox_status_enum AS ENUM ('waiting', 'answered', 'timed_out', 'dropped');
+    END IF;
+END
+$$;
+
+CREATE TABLE IF NOT EXISTS agent_inbox_message (
+    inbox_message_id BIGINT GENERATED BY DEFAULT AS IDENTITY PRIMARY KEY,
+    job_id BIGINT NOT NULL,
+    role agent_inbox_role_enum NOT NULL,
+    kind agent_inbox_kind_enum NOT NULL,
+    payload_json JSONB NOT NULL DEFAULT '{}'::jsonb,
+    reply_to_id BIGINT NULL,
+    status agent_inbox_status_enum NULL,
+    created_at TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP,
+    answered_at TIMESTAMP NULL,
+    CONSTRAINT fk_agent_inbox_message_job
+        FOREIGN KEY (job_id) REFERENCES background_job(job_id) ON DELETE CASCADE,
+    CONSTRAINT fk_agent_inbox_message_reply_to
+        FOREIGN KEY (reply_to_id) REFERENCES agent_inbox_message(inbox_message_id) ON DELETE SET NULL
+);
+
+CREATE INDEX IF NOT EXISTS idx_agent_inbox_message_job_created
+    ON agent_inbox_message (job_id, created_at);
+
+CREATE INDEX IF NOT EXISTS idx_agent_inbox_message_job_status
+    ON agent_inbox_message (job_id, status)
+    WHERE status IS NOT NULL;
+```
+
+- [ ] **Step 2: 在本地 PostgreSQL 应用迁移（按既有 Flyway 流程）**
+
+Run: `docker compose -f docker/compose.yml up flyway --build` 或项目既有 migration 命令。
+Expected: V14 标记为 success；`\dt agent_inbox_message` 在 psql 中能看到新表。
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add docker/flyway/migrations/V14__agent_inbox.sql
+git commit -m "feat(agent): V14 add agent_inbox_message table"
+```
+
+---
+
+## Task 4: ORM model `AgentInboxMessage`
+
+**Files:**
+
+- Modify: `app/src/fileflash/models/tables_agent.py`
+- Modify: `app/src/fileflash/models/__init__.py`
+
+- [ ] **Step 1: 在 `tables_agent.py` 顶部导入区追加**
+
+```python
+from .enums import (
+    AgentExecutionPolicy,
+    AgentInboxKind,
+    AgentInboxRole,
+    AgentInboxStatus,
+    AgentMcpVisibility,
+    AgentMemoryKind,
+    AgentMemoryScope,
+    AgentSkillVisibility,
+)
+```
+
+- [ ] **Step 2: 在 `AgentWorkSession` 类之后追加 `AgentInboxMessage` 类**
+
+```python
+class AgentInboxMessage(Base):
+    """ORM mapping for the ``agent_inbox_message`` table.
+
+    One row is one message attached to a background job. ``role`` and ``kind``
+    classify the message, ``payload_json`` carries its body, and ``reply_to_id``
+    optionally points at another row of the same table.
+    """
+
+    __tablename__ = "agent_inbox_message"
+    __table_args__ = (
+        Index("idx_agent_inbox_message_job_created", "job_id", "created_at"),
+        # Partial index: only rows that carry a status are indexed.
+        Index(
+            "idx_agent_inbox_message_job_status",
+            "job_id",
+            "status",
+            postgresql_where=text("status IS NOT NULL"),
+        ),
+    )
+
+    inbox_message_id: Mapped[int] = mapped_column(BigInteger, Identity(), primary_key=True)
+    # Owning job; rows are removed together with the job (ON DELETE CASCADE).
+    job_id: Mapped[int] = mapped_column(
+        BigInteger,
+        ForeignKey("background_job.job_id", ondelete="CASCADE"),
+        nullable=False,
+    )
+    role: Mapped[AgentInboxRole] = mapped_column(
+        pg_enum(AgentInboxRole, "agent_inbox_role_enum"),
+        nullable=False,
+    )
+    kind: Mapped[AgentInboxKind] = mapped_column(
+        pg_enum(AgentInboxKind, "agent_inbox_kind_enum"),
+        nullable=False,
+    )
+    payload_json: Mapped[dict[str, Any]] = mapped_column(
+        JSONB,
+        nullable=False,
+        server_default=text("'{}'::jsonb"),
+    )
+    # Self-reference to another inbox message; reset to NULL if that row is deleted.
+    reply_to_id: Mapped[int | None] = mapped_column(
+        BigInteger,
+        ForeignKey("agent_inbox_message.inbox_message_id", ondelete="SET NULL"),
+    )
+    # Nullable on purpose: no nullable=False is set, so a row may carry no status at all.
+    status: Mapped[AgentInboxStatus | None] = mapped_column(
+        pg_enum(AgentInboxStatus, "agent_inbox_status_enum"),
+    )
+    # NOTE(review): DateTime is declared without timezone=True (naive TIMESTAMP), while the
+    # snippets in this plan pass datetime.now(UTC) (timezone-aware) for created_at/answered_at.
+    # Confirm the DB driver in use accepts aware values for naive columns.
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime,
+        nullable=False,
+        server_default=text("CURRENT_TIMESTAMP"),
+    )
+    answered_at: Mapped[datetime | None] = mapped_column(DateTime)
+```
+
+- [ ] **Step 3: 按字母序把 `AgentInboxMessage` 加入 `tables_agent.py` 的 `__all__`（见下例），并在 `app/src/fileflash/models/__init__.py` 导出**
+
+```python
+# tables_agent.py __all__
+__all__ = [
+    "AgentActionLog",
+    "AgentInboxMessage",
+    "AgentMcpServer",
+    "AgentMemory",
+    "AgentPlan",
+    "AgentSkill",
+    "AgentUserSetting",
+    "AgentWorkSession",
+]
+```
+
+- [ ] **Step 4: 写最小 sanity 测试，确认 model 能与 DB 通信**
+
+新建 `app/tests/test_agent_inbox_model.py`：
+
+```python
+from datetime import UTC, datetime
+
+import pytest
+from sqlalchemy import select
+
+from fileflash.models import AgentInboxMessage, BackgroundJob
+from fileflash.models.enums import AgentInboxKind, AgentInboxRole, AgentInboxStatus
+
+
+@pytest.mark.asyncio
+async def test_insert_ask_message_round_trip(db_session, sample_background_job):  # noqa: ANN001
+    msg = AgentInboxMessage(
+        job_id=sample_background_job.job_id,
+        role=AgentInboxRole.AGENT,
+        kind=AgentInboxKind.ASK,
+        payload_json={"prompt": "which one?", "schema": {}},
+        status=AgentInboxStatus.WAITING,
+        created_at=datetime.now(UTC),
+    )
+    db_session.add(msg)
+    await db_session.commit()
+    fetched = await db_session.scalar(select(AgentInboxMessage).where(
+        AgentInboxMessage.inbox_message_id == msg.inbox_message_id
+    ))
+    assert fetched is not None
+    assert fetched.kind == AgentInboxKind.ASK
+    assert fetched.status == AgentInboxStatus.WAITING
+    assert fetched.payload_json["prompt"] == "which one?"
+```
+
+> 注：`db_session` / `sample_background_job` 是项目既有 pytest fixture（参见 `app/tests/test_agent_repositories.py`）。如名字不一致，沿用该测试文件里的 fixture 名。
+
+- [ ] **Step 5: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_inbox_model.py -v`
+Expected: PASS
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add app/src/fileflash/models/tables_agent.py app/src/fileflash/models/__init__.py app/tests/test_agent_inbox_model.py
+git commit -m "feat(agent): add AgentInboxMessage ORM model"
+```
+
+---
+
+## Task 5: `AgentInboxMessageRepository`
+
+**Files:**
+
+- Create: `app/src/fileflash/repositories/agent/inbox.py`
+- Modify: `app/src/fileflash/repositories/__init__.py`
+- Create: `app/tests/test_agent_inbox_repository.py`
+
+- [ ] **Step 1: 写测试（先 fail）**
+
+```python
+# app/tests/test_agent_inbox_repository.py
+from datetime import UTC, datetime
+
+import pytest
+
+from fileflash.models.enums import AgentInboxKind, AgentInboxRole, AgentInboxStatus
+from fileflash.repositories import AgentInboxMessageRepository
+
+
+@pytest.mark.asyncio
+async def test_create_ask_then_record_reply(db_session, sample_background_job):  # noqa: ANN001
+    repo = AgentInboxMessageRepository(db_session)
+    ask = await repo.create_ask(
+        job_id=int(sample_background_job.job_id),
+        payload={"prompt": "choose", "schema": {"choice": ["A", "B"]}},
+    )
+    await db_session.commit()
+    assert ask.status == AgentInboxStatus.WAITING
+    assert ask.role == AgentInboxRole.AGENT
+    assert ask.kind == AgentInboxKind.ASK
+
+    reply = await repo.record_user_message(
+        job_id=int(sample_background_job.job_id),
+        kind=AgentInboxKind.REPLY,
+        payload={"value": "A"},
+        reply_to_id=int(ask.inbox_message_id),
+    )
+    await db_session.commit()
+    assert reply.role == AgentInboxRole.USER
+    assert reply.reply_to_id == ask.inbox_message_id
+
+    answered = await repo.mark_answered(
+        inbox_message_id=int(ask.inbox_message_id),
+        answered_at=datetime.now(UTC),
+    )
+    await db_session.commit()
+    assert answered.status == AgentInboxStatus.ANSWERED
+    assert answered.answered_at is not None
+
+
+@pytest.mark.asyncio
+async def test_pending_controls_excludes_consumed(db_session, sample_background_job):  # noqa: ANN001
+    repo = AgentInboxMessageRepository(db_session)
+    pause = await repo.record_user_message(
+        job_id=int(sample_background_job.job_id),
+        kind=AgentInboxKind.CONTROL_PAUSE,
+        payload={},
+    )
+    await db_session.commit()
+
+    pending = await repo.list_pending_controls(job_id=int(sample_background_job.job_id))
+    assert [m.inbox_message_id for m in pending] == [pause.inbox_message_id]
+
+    await repo.mark_dropped(inbox_message_id=int(pause.inbox_message_id))
+    await db_session.commit()
+    pending_after = await repo.list_pending_controls(job_id=int(sample_background_job.job_id))
+    assert pending_after == []
+```
+
+- [ ] **Step 2: 运行测试，确认 fail**
+
+Run: `cd app && uv run pytest tests/test_agent_inbox_repository.py -v`
+Expected: FAIL — `AgentInboxMessageRepository` not exported.
+
+- [ ] **Step 3: 实现 repository**
+
+`app/src/fileflash/repositories/agent/inbox.py`：
+
+```python
+from __future__ import annotations
+
+from datetime import UTC, datetime
+from typing import Any
+
+from sqlalchemy import and_, select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ...models import AgentInboxMessage
+from ...models.enums import AgentInboxKind, AgentInboxRole, AgentInboxStatus
+
+_CONTROL_KINDS = frozenset(
+    {
+        AgentInboxKind.CONTROL_PAUSE,
+        AgentInboxKind.CONTROL_RESUME,
+        AgentInboxKind.CONTROL_APPROVE,
+        AgentInboxKind.CONTROL_DENY,
+        AgentInboxKind.CONTROL_SKIP,
+        AgentInboxKind.CONTROL_CANCEL,
+    }
+)
+
+
+class AgentInboxMessageRepository:
+    def __init__(self, db: AsyncSession) -> None:
+        self._db = db
+
+    async def create_ask(
+        self,
+        *,
+        job_id: int,
+        payload: dict[str, Any],
+    ) -> AgentInboxMessage:
+        msg = AgentInboxMessage(
+            job_id=job_id,
+            role=AgentInboxRole.AGENT,
+            kind=AgentInboxKind.ASK,
+            payload_json=payload,
+            status=AgentInboxStatus.WAITING,
+            created_at=datetime.now(UTC),
+        )
+        self._db.add(msg)
+        await self._db.flush()
+        return msg
+
+    async def record_user_message(
+        self,
+        *,
+        job_id: int,
+        kind: AgentInboxKind,
+        payload: dict[str, Any],
+        reply_to_id: int | None = None,
+    ) -> AgentInboxMessage:
+        msg = AgentInboxMessage(
+            job_id=job_id,
+            role=AgentInboxRole.USER,
+            kind=kind,
+            payload_json=payload,
+            reply_to_id=reply_to_id,
+            status=None,
+            created_at=datetime.now(UTC),
+        )
+        self._db.add(msg)
+        await self._db.flush()
+        return msg
+
+    async def mark_answered(
+        self,
+        *,
+        inbox_message_id: int,
+        answered_at: datetime,
+    ) -> AgentInboxMessage:
+        msg = await self._db.get(AgentInboxMessage, inbox_message_id)
+        if msg is None:
+            raise ValueError(f"AgentInboxMessage {inbox_message_id} not found")
+        msg.status = AgentInboxStatus.ANSWERED
+        msg.answered_at = answered_at
+        await self._db.flush()
+        return msg
+
+    async def mark_dropped(self, *, inbox_message_id: int) -> None:
+        msg = await self._db.get(AgentInboxMessage, inbox_message_id)
+        if msg is None:
+            return
+        if msg.kind in _CONTROL_KINDS:
+            msg.status = AgentInboxStatus.DROPPED
+            msg.answered_at = datetime.now(UTC)
+        await self._db.flush()
+
+    async def get_ask(self, *, inbox_message_id: int) -> AgentInboxMessage | None:
+        msg = await self._db.get(AgentInboxMessage, inbox_message_id)
+        if msg is None or msg.kind != AgentInboxKind.ASK:
+            return None
+        return msg
+
+    async def get_reply_for(self, *, ask_id: int) -> AgentInboxMessage | None:
+        return await self._db.scalar(
+            select(AgentInboxMessage).where(
+                and_(
+                    AgentInboxMessage.reply_to_id == ask_id,
+                    AgentInboxMessage.kind == AgentInboxKind.REPLY,
+                )
+            )
+        )
+
+    async def list_pending_controls(self, *, job_id: int) -> list[AgentInboxMessage]:
+        rows = await self._db.scalars(
+            select(AgentInboxMessage)
+            .where(
+                and_(
+                    AgentInboxMessage.job_id == job_id,
+                    AgentInboxMessage.role == AgentInboxRole.USER,
+                    AgentInboxMessage.kind.in_(list(_CONTROL_KINDS)),
+                    AgentInboxMessage.status.is_(None),
+                )
+            )
+            .order_by(AgentInboxMessage.created_at.asc())
+        )
+        return list(rows)
+```
+
+> 注：control 消息以"`status IS NULL` 表示未消费"为约定；worker 处理完后调用 `mark_dropped`（该命名仅表示"已消费、不再有效"，并不代表用户操作有误；它只对 control 类消息生效）。Reply 消息自身保持 `status IS NULL`，其对应的 ask 由 `mark_answered` 标记为已回答。
+
+- [ ] **Step 4: 导出**
+
+`app/src/fileflash/repositories/__init__.py`：在合适位置新增
+
+```python
+from .agent.inbox import AgentInboxMessageRepository
+
+__all__ = [
+    # ... existing entries ...
+    "AgentInboxMessageRepository",
+]
+```
+
+- [ ] **Step 5: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_inbox_repository.py -v`
+Expected: PASS（2 个用例）
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add app/src/fileflash/repositories/agent/inbox.py app/src/fileflash/repositories/__init__.py app/tests/test_agent_inbox_repository.py
+git commit -m "feat(agent): add AgentInboxMessageRepository"
+```
+
+---
+
+## Task 6: 新事件类型与上行 message schemas
+
+**Files:**
+
+- Modify: `app/src/fileflash/schemas/agent.py`
+
+- [ ] **Step 1: 扩展 `AgentJobEventType` 字面量与新增上行 message 模型**
+
+把 `AgentJobEventType` 改为：
+
+```python
+AgentJobEventType = Literal[
+    "job.queued",
+    "job.running",
+    "plan.ready",
+    "tool.started",
+    "tool.succeeded",
+    "tool.failed",
+    "tool.partial",
+    "agent.thinking",
+    "agent.progress",
+    "agent.ask",
+    "agent.paused",
+    "agent.resumed",
+    "job.succeeded",
+    "job.failed",
+    "job.canceled",
+]
+```
+
+在文件末尾（`__all__` 之前）新增：
+
+```python
+AgentInboxMessageKind = Literal[
+    "reply",
+    "control.pause",
+    "control.resume",
+    "control.approve",
+    "control.deny",
+    "control.skip",
+    "control.cancel",
+]
+
+
+class AgentInboxMessageRequest(CamelModel):
+    kind: AgentInboxMessageKind
+    reply_to: str | None = None              # ask 的 inbox_message_id（str-encoded）
+    value: Any = None                        # reply 时为用户回答；control 时通常 None
+    metadata: dict[str, Any] = Field(default_factory=dict)
+
+
+class AgentInboxMessageResponse(CamelModel):
+    inbox_message_id: str
+    kind: AgentInboxMessageKind
+    accepted_at: datetime
+```
+
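+把 `AgentInboxMessageRequest`、`AgentInboxMessageResponse` 这两个模型名加入 `__all__`（若 `AgentInboxMessageKind` 需要被其它模块导入，也一并导出）。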
+
+- [ ] **Step 2: 写最小验证测试**
+
+新建 `app/tests/test_agent_inbox_schema.py`：
+
+```python
+import pytest
+from pydantic import ValidationError
+
+from fileflash.schemas.agent import AgentInboxMessageRequest
+
+
+def test_reply_with_value_validates() -> None:
+    msg = AgentInboxMessageRequest.model_validate(
+        {"kind": "reply", "replyTo": "42", "value": "yes"}
+    )
+    assert msg.kind == "reply"
+    assert msg.reply_to == "42"
+    assert msg.value == "yes"
+
+
+def test_unknown_kind_rejected() -> None:
+    with pytest.raises(ValidationError):
+        AgentInboxMessageRequest.model_validate({"kind": "control.explode"})
+```
+
+- [ ] **Step 3: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_inbox_schema.py -v`
+Expected: PASS
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add app/src/fileflash/schemas/agent.py app/tests/test_agent_inbox_schema.py
+git commit -m "feat(agent): extend job event types and add inbox message schemas"
+```
+
+---
+
+## Task 7: `AgentEventBus`（Redis pub/sub 封装）
+
+**Files:**
+
+- Create: `app/src/fileflash/agents/harness/event_bus.py`
+- Modify: `app/src/fileflash/agents/harness/events.py` — 保留 `AgentEvent`，删除 `EventBus` scaffold
+- Create: `app/tests/test_agent_event_bus.py`
+
+- [ ] **Step 1: 写测试（先 fail）**
+
+```python
+# app/tests/test_agent_event_bus.py
+from datetime import UTC, datetime
+
+import pytest
+
+from fileflash.agents.harness.event_bus import (
+    AgentEventEnvelope,
+    InMemoryAgentEventBus,
+)
+
+
+@pytest.mark.asyncio
+async def test_subscriber_receives_published_event() -> None:
+    bus = InMemoryAgentEventBus()
+    envelope = AgentEventEnvelope(
+        job_id=42,
+        event_type="agent.ask",
+        payload={"prompt": "choose"},
+        emitted_at=datetime.now(UTC),
+    )
+    async with bus.subscribe(job_id=42) as stream:
+        await bus.publish(envelope)
+        received = await stream.next(timeout=1.0)
+    assert received == envelope
+
+
+@pytest.mark.asyncio
+async def test_only_subscribers_of_same_job_receive() -> None:
+    bus = InMemoryAgentEventBus()
+    own = AgentEventEnvelope(job_id=1, event_type="job.running", payload={}, emitted_at=datetime.now(UTC))
+    other = AgentEventEnvelope(job_id=2, event_type="job.running", payload={}, emitted_at=datetime.now(UTC))
+    async with bus.subscribe(job_id=1) as stream:
+        await bus.publish(other)
+        await bus.publish(own)
+        first = await stream.next(timeout=1.0)
+    assert first == own
+
+
+@pytest.mark.asyncio
+async def test_close_subscriber_unblocks() -> None:
+    bus = InMemoryAgentEventBus()
+    async with bus.subscribe(job_id=7) as stream:
+        with pytest.raises(TimeoutError):
+            await stream.next(timeout=0.1)
+```
+
+- [ ] **Step 2: 运行测试，确认 fail**
+
+Run: `cd app && uv run pytest tests/test_agent_event_bus.py -v`
+Expected: FAIL — module missing.
+
+- [ ] **Step 3: 实现 `event_bus.py`**
+
+```python
+# app/src/fileflash/agents/harness/event_bus.py
+from __future__ import annotations
+
+import asyncio
+import contextlib
+import json
+import logging
+from collections.abc import AsyncIterator
+from dataclasses import asdict, dataclass, field
+from datetime import datetime
+from typing import Any, Protocol
+
+from redis.asyncio import Redis
+
+from ...core.settings import Settings, get_settings
+
+logger = logging.getLogger(__name__)
+
+
+@dataclass(slots=True)
+class AgentEventEnvelope:
+    job_id: int
+    event_type: str
+    payload: dict[str, Any]
+    emitted_at: datetime
+    event_id: str | None = None
+
+    def to_json(self) -> str:
+        body = asdict(self)
+        body["emitted_at"] = self.emitted_at.isoformat()
+        return json.dumps(body, ensure_ascii=False, separators=(",", ":"))
+
+    @classmethod
+    def from_json(cls, raw: str) -> "AgentEventEnvelope":
+        data = json.loads(raw)
+        return cls(
+            job_id=int(data["job_id"]),
+            event_type=str(data["event_type"]),
+            payload=dict(data.get("payload") or {}),
+            emitted_at=datetime.fromisoformat(data["emitted_at"]),
+            event_id=data.get("event_id"),
+        )
+
+
+class AgentEventStream(Protocol):
+    """Structural interface of a per-subscription event stream."""
+
+    # Return the next envelope; the implementations in this module raise TimeoutError
+    # when nothing arrives within `timeout`.
+    async def next(self, *, timeout: float | None = None) -> AgentEventEnvelope: ...
+    # Release whatever the stream holds.
+    async def aclose(self) -> None: ...
+
+
+class AgentEventBus(Protocol):
+    async def publish(self, envelope: AgentEventEnvelope) -> None: ...
+    def subscribe(self, *, job_id: int) -> "AgentEventSubscription": ...
+
+
+@dataclass(slots=True)
+class _InMemoryStream:
+    queue: asyncio.Queue[AgentEventEnvelope]
+
+    async def next(self, *, timeout: float | None = None) -> AgentEventEnvelope:
+        if timeout is None:
+            return await self.queue.get()
+        return await asyncio.wait_for(self.queue.get(), timeout=timeout)
+
+    async def aclose(self) -> None:
+        return None
+
+
+class InMemoryAgentEventBus:
+    """同进程实现，用于单元测试和单进程开发。生产用 RedisAgentEventBus。"""
+
+    def __init__(self, *, buffer_size: int = 64) -> None:
+        self._buffer = buffer_size
+        self._subscribers: dict[int, list[asyncio.Queue[AgentEventEnvelope]]] = {}
+
+    async def publish(self, envelope: AgentEventEnvelope) -> None:
+        queues = list(self._subscribers.get(envelope.job_id, []))
+        for q in queues:
+            if q.full():
+                logger.warning("InMemoryAgentEventBus drop: queue full job_id=%s", envelope.job_id)
+                continue
+            await q.put(envelope)
+
+    @contextlib.asynccontextmanager
+    async def subscribe(self, *, job_id: int) -> AsyncIterator[_InMemoryStream]:
+        q: asyncio.Queue[AgentEventEnvelope] = asyncio.Queue(maxsize=self._buffer)
+        self._subscribers.setdefault(job_id, []).append(q)
+        try:
+            yield _InMemoryStream(queue=q)
+        finally:
+            self._subscribers[job_id].remove(q)
+            if not self._subscribers[job_id]:
+                del self._subscribers[job_id]
+
+
+class RedisAgentEventBus:
+    """生产实现：worker 进程 publish 到 channel，web 进程 subscribe。"""
+
+    def __init__(
+        self,
+        *,
+        redis: Redis,
+        channel_prefix: str,
+        buffer_size: int = 64,
+    ) -> None:
+        self._redis = redis
+        self._channel_prefix = channel_prefix
+        self._buffer = buffer_size
+
+    def _channel(self, job_id: int) -> str:
+        return f"{self._channel_prefix}:{job_id}:events"
+
+    async def publish(self, envelope: AgentEventEnvelope) -> None:
+        await self._redis.publish(self._channel(envelope.job_id), envelope.to_json())
+
+    @contextlib.asynccontextmanager
+    async def subscribe(self, *, job_id: int) -> AsyncIterator["_RedisStream"]:
+        pubsub = self._redis.pubsub()
+        await pubsub.subscribe(self._channel(job_id))
+        stream = _RedisStream(pubsub=pubsub)
+        try:
+            yield stream
+        finally:
+            await pubsub.unsubscribe(self._channel(job_id))
+            await pubsub.aclose()
+
+
+@dataclass(slots=True)
+class _RedisStream:
+    pubsub: Any
+
+    async def next(self, *, timeout: float | None = None) -> AgentEventEnvelope:
+        message = await self.pubsub.get_message(
+            ignore_subscribe_messages=True,
+            timeout=timeout if timeout is not None else 0,
+        )
+        if message is None:
+            raise TimeoutError("No event within timeout")
+        data = message.get("data")
+        if isinstance(data, bytes):
+            data = data.decode("utf-8")
+        return AgentEventEnvelope.from_json(str(data))
+
+    async def aclose(self) -> None:
+        await self.pubsub.aclose()
+
+
+def build_agent_event_bus(*, settings: Settings | None = None, redis: Redis | None = None) -> AgentEventBus:
+    cfg = settings or get_settings()
+    if redis is None:
+        if not cfg.redis_url:
+            return InMemoryAgentEventBus(buffer_size=cfg.agent_event_bus_buffer_size)
+        from redis.asyncio import Redis as RedisClient  # local import to avoid hard dep at import time
+
+        redis = RedisClient.from_url(cfg.redis_url, decode_responses=True)
+    return RedisAgentEventBus(
+        redis=redis,
+        channel_prefix=cfg.agent_event_channel_prefix,
+        buffer_size=cfg.agent_event_bus_buffer_size,
+    )
+```
+
+- [ ] **Step 4: 清理 events.py scaffold**
+
+`app/src/fileflash/agents/harness/events.py` 改为：
+
+```python
+# Kept as a re-export shim until callers migrate to event_bus.py.
+from .event_bus import AgentEventEnvelope as AgentEvent
+
+__all__ = ["AgentEvent"]
+```
+
+> 此 shim 将在后续 PR 中删除；本 plan 暂不删除，以免外部 import 路径同时变更。删除 `EventBus` scaffold 前，请先确认没有其它模块（例如 `harness/__init__.py`）仍在从 `events.py` 导入 `EventBus`。
+
+- [ ] **Step 5: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_event_bus.py -v`
+Expected: PASS（3 个用例）
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add app/src/fileflash/agents/harness/event_bus.py app/src/fileflash/agents/harness/events.py app/tests/test_agent_event_bus.py
+git commit -m "feat(agent): add AgentEventBus with in-memory and Redis impls"
+```
+
+---
+
+## Task 8: `AgentInbox` 服务（写表 + publish）
+
+**Files:**
+
+- Create: `app/src/fileflash/agents/harness/inbox.py`
+- Create: `app/tests/test_agent_inbox.py`
+
+- [ ] **Step 1: 写测试**
+
+```python
+# app/tests/test_agent_inbox.py
+from datetime import UTC, datetime
+
+import pytest
+
+from fileflash.agents.harness.event_bus import InMemoryAgentEventBus
+from fileflash.agents.harness.inbox import AgentInbox
+from fileflash.models.enums import AgentInboxKind
+from fileflash.repositories import AgentInboxMessageRepository
+
+
+@pytest.mark.asyncio
+async def test_handle_reply_persists_and_publishes(db_session, sample_background_job):  # noqa: ANN001
+    repo = AgentInboxMessageRepository(db_session)
+    ask = await repo.create_ask(
+        job_id=int(sample_background_job.job_id),
+        payload={"prompt": "?"},
+    )
+    await db_session.commit()
+
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=db_session, event_bus=bus)
+
+    async with bus.subscribe(job_id=int(sample_background_job.job_id)) as stream:
+        msg = await inbox.handle(
+            job_id=int(sample_background_job.job_id),
+            kind=AgentInboxKind.REPLY,
+            payload={"value": "yes"},
+            reply_to_id=int(ask.inbox_message_id),
+        )
+        await db_session.commit()
+        evt = await stream.next(timeout=1.0)
+
+    assert msg.kind == AgentInboxKind.REPLY
+    assert evt.event_type == "agent.inbox.reply"
+    assert evt.payload["replyTo"] == str(ask.inbox_message_id)
+    assert evt.payload["value"] == "yes"
+
+
+@pytest.mark.asyncio
+async def test_reply_with_unknown_ask_raises(db_session, sample_background_job):  # noqa: ANN001
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=db_session, event_bus=bus)
+    with pytest.raises(ValueError):
+        await inbox.handle(
+            job_id=int(sample_background_job.job_id),
+            kind=AgentInboxKind.REPLY,
+            payload={"value": "yes"},
+            reply_to_id=999999,
+        )
+```
+
+- [ ] **Step 2: 运行测试，确认 fail**
+
+Run: `cd app && uv run pytest tests/test_agent_inbox.py -v`
+Expected: FAIL — module missing.
+
+- [ ] **Step 3: 实现 `AgentInbox`**
+
+```python
+# app/src/fileflash/agents/harness/inbox.py
+from __future__ import annotations
+
+from datetime import UTC, datetime
+from typing import Any
+
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ...models.enums import AgentInboxKind
+from ...repositories import AgentInboxMessageRepository
+from .event_bus import AgentEventBus, AgentEventEnvelope
+
+
+_INBOX_EVENT_TYPES: dict[AgentInboxKind, str] = {
+    AgentInboxKind.REPLY: "agent.inbox.reply",
+    AgentInboxKind.CONTROL_PAUSE: "agent.inbox.control",
+    AgentInboxKind.CONTROL_RESUME: "agent.inbox.control",
+    AgentInboxKind.CONTROL_APPROVE: "agent.inbox.control",
+    AgentInboxKind.CONTROL_DENY: "agent.inbox.control",
+    AgentInboxKind.CONTROL_SKIP: "agent.inbox.control",
+    AgentInboxKind.CONTROL_CANCEL: "agent.inbox.control",
+}
+
+
+class AgentInbox:
+    """Records a user inbox message and announces it on the event bus."""
+
+    def __init__(self, *, db: AsyncSession, event_bus: AgentEventBus) -> None:
+        self._db = db
+        self._bus = event_bus
+        self._repo = AgentInboxMessageRepository(db)
+
+    async def handle(
+        self,
+        *,
+        job_id: int,
+        kind: AgentInboxKind,
+        payload: dict[str, Any],
+        reply_to_id: int | None = None,
+    ):
+        """Persist one user message for ``job_id`` and publish the matching event.
+
+        Returns the row created by the repository.
+
+        Raises:
+            ValueError: for a REPLY without ``reply_to_id``, or whose ask does not
+                exist or belongs to a different job.
+            KeyError: if ``kind`` has no entry in ``_INBOX_EVENT_TYPES``.
+        """
+        # Only replies are validated against an existing ask; control kinds skip this.
+        if kind == AgentInboxKind.REPLY:
+            if reply_to_id is None:
+                raise ValueError("reply requires reply_to_id")
+            ask = await self._repo.get_ask(inbox_message_id=reply_to_id)
+            if ask is None:
+                raise ValueError(f"ask {reply_to_id} not found")
+            if ask.job_id != job_id:
+                raise ValueError(f"ask {reply_to_id} belongs to a different job")
+
+        msg = await self._repo.record_user_message(
+            job_id=job_id,
+            kind=kind,
+            payload=payload,
+            reply_to_id=reply_to_id,
+        )
+        event_type = _INBOX_EVENT_TYPES[kind]
+        # Ids are sent as strings; replyTo and value are included only when present.
+        envelope_payload: dict[str, Any] = {"kind": kind.value, "messageId": str(msg.inbox_message_id)}
+        if reply_to_id is not None:
+            envelope_payload["replyTo"] = str(reply_to_id)
+        if "value" in payload:
+            envelope_payload["value"] = payload["value"]
+        # NOTE(review): this method never commits, so the event is published before the
+        # caller's commit; a subscriber using another DB session may see the event before
+        # the row is visible. Confirm this ordering is acceptable.
+        await self._bus.publish(
+            AgentEventEnvelope(
+                job_id=job_id,
+                event_type=event_type,
+                payload=envelope_payload,
+                emitted_at=datetime.now(UTC),
+            )
+        )
+        return msg
+```
+
+- [ ] **Step 4: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_inbox.py -v`
+Expected: PASS（2 个用例）
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add app/src/fileflash/agents/harness/inbox.py app/tests/test_agent_inbox.py
+git commit -m "feat(agent): add AgentInbox service"
+```
+
+---
+
+## Task 9: `AskProtocol`（worker 等用户回答）
+
+**Files:**
+
+- Create: `app/src/fileflash/agents/harness/ask.py`
+- Create: `app/tests/test_agent_ask_protocol.py`
+
+- [ ] **Step 1: 写测试**
+
+```python
+# app/tests/test_agent_ask_protocol.py
+import asyncio
+from datetime import UTC, datetime
+
+import pytest
+
+from fileflash.agents.harness.ask import AskProtocol, AskTimedOut
+from fileflash.agents.harness.event_bus import InMemoryAgentEventBus
+from fileflash.agents.harness.inbox import AgentInbox
+from fileflash.models.enums import AgentInboxKind, AgentInboxStatus
+from fileflash.repositories import AgentInboxMessageRepository
+
+
+@pytest.mark.asyncio
+async def test_ask_returns_when_reply_arrives(db_session, sample_background_job):  # noqa: ANN001
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=db_session, event_bus=bus)
+    protocol = AskProtocol(
+        db=db_session,
+        event_bus=bus,
+        job_id=int(sample_background_job.job_id),
+    )
+    await protocol.start()
+    try:
+        async def reply_later():
+            await asyncio.sleep(0.05)
+            # 找到刚创建的 ask
+            repo = AgentInboxMessageRepository(db_session)
+            from sqlalchemy import select
+            from fileflash.models import AgentInboxMessage
+            ask = await db_session.scalar(
+                select(AgentInboxMessage)
+                .where(AgentInboxMessage.kind == AgentInboxKind.ASK)
+                .order_by(AgentInboxMessage.inbox_message_id.desc())
+            )
+            await inbox.handle(
+                job_id=int(sample_background_job.job_id),
+                kind=AgentInboxKind.REPLY,
+                payload={"value": "A"},
+                reply_to_id=int(ask.inbox_message_id),
+            )
+            await db_session.commit()
+
+        replier = asyncio.create_task(reply_later())
+        result = await protocol.ask(
+            prompt="choose",
+            schema={"choice": ["A", "B"]},
+            timeout_sec=2.0,
+        )
+        await replier
+    finally:
+        await protocol.aclose()
+
+    assert result == "A"
+
+
+@pytest.mark.asyncio
+async def test_ask_times_out(db_session, sample_background_job):  # noqa: ANN001
+    bus = InMemoryAgentEventBus()
+    protocol = AskProtocol(
+        db=db_session,
+        event_bus=bus,
+        job_id=int(sample_background_job.job_id),
+    )
+    await protocol.start()
+    try:
+        with pytest.raises(AskTimedOut):
+            await protocol.ask(prompt="?", schema={}, timeout_sec=0.1)
+    finally:
+        await protocol.aclose()
+
+    # 验证 ask 已被标 timed_out
+    from sqlalchemy import select
+    from fileflash.models import AgentInboxMessage
+    asks = list(
+        await db_session.scalars(
+            select(AgentInboxMessage).where(AgentInboxMessage.kind == AgentInboxKind.ASK)
+        )
+    )
+    assert asks
+    assert asks[-1].status == AgentInboxStatus.TIMED_OUT
+```
+
+- [ ] **Step 2: 运行测试，确认 fail**
+
+Run: `cd app && uv run pytest tests/test_agent_ask_protocol.py -v`
+Expected: FAIL — module missing.
+
+- [ ] **Step 3: 实现 `AskProtocol`**
+
+```python
+# app/src/fileflash/agents/harness/ask.py
+from __future__ import annotations
+
+import asyncio
+import contextlib
+from datetime import UTC, datetime
+from typing import Any
+
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ...models.enums import AgentInboxKind
+from ...repositories import AgentInboxMessageRepository
+from .event_bus import AgentEventBus, AgentEventEnvelope
+
+
+class AskTimedOut(Exception):
+    def __init__(self, *, ask_id: int) -> None:
+        super().__init__(f"Ask {ask_id} timed out")
+        self.ask_id = ask_id
+
+
+class AskProtocol:
+    """worker 端：创建 ask 表条目、publish agent.ask 事件、阻塞等 reply 经 inbox channel 唤醒。
+
+    生命周期绑定单个 job_id。`start()` 后开始订阅；`aclose()` 释放订阅。
+    """
+
+    def __init__(
+        self,
+        *,
+        db: AsyncSession,
+        event_bus: AgentEventBus,
+        job_id: int,
+    ) -> None:
+        self._db = db
+        self._bus = event_bus
+        self._job_id = job_id
+        self._repo = AgentInboxMessageRepository(db)
+        self._waiters: dict[int, asyncio.Future[Any]] = {}
+        self._sub_ctx = None
+        self._sub_stream = None
+        self._sub_task: asyncio.Task[None] | None = None
+
+    async def start(self) -> None:
+        self._sub_ctx = self._bus.subscribe(job_id=self._job_id)
+        self._sub_stream = await self._sub_ctx.__aenter__()
+        self._sub_task = asyncio.create_task(self._listen())
+
+    async def aclose(self) -> None:
+        if self._sub_task is not None:
+            self._sub_task.cancel()
+            with contextlib.suppress(asyncio.CancelledError):
+                await self._sub_task
+        if self._sub_ctx is not None:
+            await self._sub_ctx.__aexit__(None, None, None)
+        for fut in self._waiters.values():
+            if not fut.done():
+                fut.cancel()
+
+    async def ask(
+        self,
+        *,
+        prompt: str,
+        schema: dict[str, Any],
+        timeout_sec: float,
+    ) -> Any:
+        msg = await self._repo.create_ask(
+            job_id=self._job_id,
+            payload={"prompt": prompt, "schema": schema, "timeoutSec": timeout_sec},
+        )
+        await self._db.commit()
+
+        await self._bus.publish(
+            AgentEventEnvelope(
+                job_id=self._job_id,
+                event_type="agent.ask",
+                payload={
+                    "messageId": str(msg.inbox_message_id),
+                    "prompt": prompt,
+                    "schema": schema,
+                    "timeoutSec": timeout_sec,
+                },
+                emitted_at=datetime.now(UTC),
+            )
+        )
+
+        loop = asyncio.get_running_loop()
+        fut: asyncio.Future[Any] = loop.create_future()
+        self._waiters[int(msg.inbox_message_id)] = fut
+        try:
+            value = await asyncio.wait_for(fut, timeout=timeout_sec)
+        except asyncio.TimeoutError as exc:
+            from ...models.enums import AgentInboxStatus
+            ask = await self._repo.get_ask(inbox_message_id=int(msg.inbox_message_id))
+            if ask is not None:
+                ask.status = AgentInboxStatus.TIMED_OUT
+                ask.answered_at = datetime.now(UTC)
+                await self._db.commit()
+            raise AskTimedOut(ask_id=int(msg.inbox_message_id)) from exc
+        finally:
+            self._waiters.pop(int(msg.inbox_message_id), None)
+
+        await self._repo.mark_answered(
+            inbox_message_id=int(msg.inbox_message_id),
+            answered_at=datetime.now(UTC),
+        )
+        await self._db.commit()
+        return value
+
+    async def _listen(self) -> None:
+        assert self._sub_stream is not None
+        while True:
+            try:
+                envelope = await self._sub_stream.next(timeout=None)
+            except asyncio.CancelledError:
+                raise
+            except Exception:  # noqa: BLE001
+                continue
+            if envelope.event_type != "agent.inbox.reply":
+                continue
+            reply_to = envelope.payload.get("replyTo")
+            if reply_to is None:
+                continue
+            try:
+                ask_id = int(reply_to)
+            except (TypeError, ValueError):
+                continue
+            fut = self._waiters.get(ask_id)
+            if fut is None or fut.done():
+                continue
+            fut.set_result(envelope.payload.get("value"))
+```
+
+- [ ] **Step 4: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_ask_protocol.py -v`
+Expected: PASS（2 个用例）
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add app/src/fileflash/agents/harness/ask.py app/tests/test_agent_ask_protocol.py
+git commit -m "feat(agent): add AskProtocol for worker-to-user blocking ask"
+```
+
+---
+
+## Task 10: `POST /agent/jobs/{job_id}/messages` 路由
+
+**Files:**
+
+- Modify: `app/src/fileflash/routers/agent.py`
+- Modify: `app/src/fileflash/core/deps.py`
+- Modify: `app/tests/test_agent_routes.py`
+
+- [ ] **Step 1: 在 `deps.py` 增加 EventBus 依赖**
+
+```python
+# app/src/fileflash/core/deps.py — 在文件末尾增加
+from ..agents.harness.event_bus import AgentEventBus, build_agent_event_bus
+
+_event_bus_singleton: AgentEventBus | None = None
+
+
+def get_agent_event_bus() -> AgentEventBus:
+    global _event_bus_singleton
+    if _event_bus_singleton is None:
+        _event_bus_singleton = build_agent_event_bus()
+    return _event_bus_singleton
+```
+
+> 注：如果 deps.py 已有 module-level singleton 模式，沿用既有写法；否则用上述简单单例。
+
+- [ ] **Step 2: 在 `routers/agent.py` 新增路由**
+
+在 `cancel_agent_job` 之前插入：
+
+```python
+from ..agents.harness.event_bus import AgentEventBus
+from ..agents.harness.inbox import AgentInbox
+from ..core.deps import get_agent_event_bus
+from ..models.enums import AgentInboxKind
+from ..schemas.agent import AgentInboxMessageRequest, AgentInboxMessageResponse
+
+
+@router.post("/jobs/{job_id}/messages")
+async def post_agent_job_message(
+    job_id: str,
+    payload: AgentInboxMessageRequest,
+    current_user: Annotated[User, Depends(get_current_user)],
+    db: Annotated[AsyncSession, Depends(get_db)],
+    event_bus: Annotated[AgentEventBus, Depends(get_agent_event_bus)],
+):
+    parsed_job_id = _parse_job_id(job_id)
+    job = await db.scalar(
+        select(BackgroundJob).where(
+            and_(
+                BackgroundJob.job_id == parsed_job_id,
+                BackgroundJob.requested_by == current_user.user_id,
+                BackgroundJob.task_type.in_(["agent.plan", "agent.execute"]),
+            )
+        )
+    )
+    if job is None:
+        raise ApiError(status_code=404, code=404, message="Job not found")
+
+    kind = AgentInboxKind(payload.kind)
+    reply_to_id: int | None = None
+    if payload.reply_to is not None:
+        try:
+            reply_to_id = int(payload.reply_to)
+        except ValueError as exc:
+            raise ApiError(status_code=400, code=400, message="Invalid replyTo") from exc
+
+    inbox = AgentInbox(db=db, event_bus=event_bus)
+    try:
+        msg = await inbox.handle(
+            job_id=parsed_job_id,
+            kind=kind,
+            payload=_inbox_payload_from_request(payload),
+            reply_to_id=reply_to_id,
+        )
+    except ValueError as exc:
+        raise ApiError(status_code=400, code=400, message=str(exc)) from exc
+    await db.commit()
+
+    data = AgentInboxMessageResponse(
+        inbox_message_id=str(msg.inbox_message_id),
+        kind=payload.kind,
+        accepted_at=msg.created_at,
+    )
+    return api_success(data=data.model_dump(by_alias=True), message="Message accepted")
+
+
+def _inbox_payload_from_request(req: AgentInboxMessageRequest) -> dict[str, Any]:
+    body: dict[str, Any] = {}
+    if req.value is not None:
+        body["value"] = req.value
+    if req.metadata:
+        body["metadata"] = req.metadata
+    return body
+```
+
+> 注：`_inbox_payload_from_request` 用到了 `typing.Any`；如果文件顶部尚未导入，请把导入改为 `from typing import Annotated, Any`。
+
+- [ ] **Step 3: 扩展 `test_agent_routes.py`，新增一组用例**
+
+```python
+# app/tests/test_agent_routes.py — 在文件末尾追加
+from fileflash.agents.harness.event_bus import InMemoryAgentEventBus
+from fileflash.core.deps import get_agent_event_bus
+from fileflash.models import AgentInboxMessage
+from fileflash.models.enums import AgentInboxKind
+
+
+def _build_app_with_bus(bus: InMemoryAgentEventBus, db_stub) -> FastAPI:  # noqa: ANN001
+    app = FastAPI()
+    app.include_router(router)
+    app.add_exception_handler(ApiError, api_error_handler)
+    app.dependency_overrides[get_db] = lambda: db_stub
+    app.dependency_overrides[get_current_user] = lambda: User(user_id=7)
+    app.dependency_overrides[get_agent_event_bus] = lambda: bus
+    return app
+
+
+def test_post_message_control_pause_accepted(db_session, sample_background_job):  # noqa: ANN001
+    bus = InMemoryAgentEventBus()
+    # 真 DB session 测；不再用 StubDb
+    app = FastAPI()
+    app.include_router(router)
+    app.add_exception_handler(ApiError, api_error_handler)
+    app.dependency_overrides[get_db] = lambda: db_session
+    app.dependency_overrides[get_current_user] = lambda: User(
+        user_id=int(sample_background_job.requested_by)
+    )
+    app.dependency_overrides[get_agent_event_bus] = lambda: bus
+
+    client = TestClient(app)
+    resp = client.post(
+        f"/agent/jobs/{sample_background_job.job_id}/messages",
+        json={"kind": "control.pause"},
+    )
+    assert resp.status_code == 200
+    body = resp.json()
+    assert body["data"]["kind"] == "control.pause"
+```
+
+> 注：上面的用例通过 `sample_background_job.requested_by` 构造当前用户，因此不依赖 fixture 的具体用户 ID；而 `_build_app_with_bus` 固定使用 `user_id=7`，只适用于 `requested_by=7` 的 BackgroundJob。如 fixture 命名不一致，按既有 fixture 调整。
+
+- [ ] **Step 4: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_routes.py -v -k "post_message"`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add app/src/fileflash/core/deps.py app/src/fileflash/routers/agent.py app/tests/test_agent_routes.py
+git commit -m "feat(agent): add POST /agent/jobs/{id}/messages upstream channel"
+```
+
+---
+
+## Task 11: SSE 端点改为订阅 EventBus
+
+**Files:**
+
+- Modify: `app/src/fileflash/routers/agent.py`
+
+- [ ] **Step 1: 替换 `stream_agent_job_events` 与 `event_stream` 内部逻辑**
+
+把现有 `stream_agent_job_events` 整体替换为：
+
+```python
+@router.get("/jobs/{job_id}/events")
+async def stream_agent_job_events(
+    job_id: str,
+    current_user: Annotated[User, Depends(get_current_user)],
+    db: Annotated[AsyncSession, Depends(get_db)],
+    event_bus: Annotated[AgentEventBus, Depends(get_agent_event_bus)],
+):
+    """Stream a job's events to the client as Server-Sent Events.
+
+    The events returned by ``_agent_job_events_for_job`` are replayed first.
+    If that replay is already terminal the stream ends there. Otherwise the
+    handler subscribes to the event bus and forwards each new envelope until
+    a ``job.succeeded`` / ``job.failed`` / ``job.canceled`` event is sent.
+    """
+    parsed_job_id = _parse_job_id(job_id)
+    initial_events, initial_terminal = await _agent_job_events_for_job(
+        db=db,
+        job_id=parsed_job_id,
+        user_id=int(current_user.user_id),
+    )
+
+    async def event_stream():
+        # Ids already sent, so an event seen in the replay is not emitted again.
+        seen: set[str] = set()
+        for event in initial_events:
+            seen.add(event.id)
+            yield _format_sse_event(event)
+        if initial_terminal:
+            return
+        # NOTE(review): the subscription starts only after the replay query has
+        # finished. Events published in between look like they would be missed;
+        # if a terminal event falls in that window the stream would only ever
+        # send keep-alives. Confirm whether the bus buffers, or whether the
+        # subscription must be opened before the replay query.
+        async with event_bus.subscribe(job_id=parsed_job_id) as stream:
+            while True:
+                try:
+                    envelope = await stream.next(timeout=30.0)
+                except TimeoutError:
+                    # 30 s heartbeat so proxies do not drop the idle connection.
+                    yield ": keep-alive\n\n"
+                    continue
+                event = _envelope_to_job_event(envelope)
+                if event.id in seen:
+                    continue
+                seen.add(event.id)
+                yield _format_sse_event(event)
+                if event.type in {"job.succeeded", "job.failed", "job.canceled"}:
+                    break
+
+    return StreamingResponse(
+        event_stream(),
+        media_type="text/event-stream",
+        headers={
+            "Cache-Control": "no-cache",
+            "X-Accel-Buffering": "no",
+        },
+    )
+```
+
+新增辅助函数：
+
+```python
+def _envelope_to_job_event(env: "AgentEventEnvelope") -> AgentJobEvent:
+    return AgentJobEvent(
+        id=env.event_id or f"{env.job_id}:{env.event_type}:{env.emitted_at.isoformat()}",
+        job_id=str(env.job_id),
+        task_type="agent.execute",  # type 在 envelope payload 里冗余，简化
+        type=env.event_type,  # type: ignore[arg-type]
+        status=str(env.payload.get("status") or ""),
+        agent_phase=env.payload.get("agentPhase"),
+        message=str(env.payload.get("message") or ""),
+        data=dict(env.payload.get("data") or env.payload),
+        timestamp=env.emitted_at,
+    )
+```
+
+把 `AGENT_EVENT_POLL_INTERVAL_SEC` 常量删掉，把 `asyncio.sleep(...)` 调用一并删除。在文件顶部加入：
+
+```python
+from ..agents.harness.event_bus import AgentEventBus, AgentEventEnvelope
+```
+
+> 注：保留 `_agent_job_events_for_job` 用作 initial replay（连接刚建立时拉一次历史），因为 pub/sub 不持久化。
+
+- [ ] **Step 2: 扩展 SSE 测试**
+
+在 `test_agent_routes.py` 已有的 SSE 用例之外加一个：
+
+```python
+def test_sse_streams_published_events(db_session, sample_background_job):  # noqa: ANN001
+    """Events published on the bus while the SSE stream is open reach the client."""
+    bus = InMemoryAgentEventBus()
+    app = FastAPI()
+    app.include_router(router)
+    app.add_exception_handler(ApiError, api_error_handler)
+    app.dependency_overrides[get_db] = lambda: db_session
+    app.dependency_overrides[get_current_user] = lambda: User(
+        user_id=int(sample_background_job.requested_by)
+    )
+    app.dependency_overrides[get_agent_event_bus] = lambda: bus
+
+    import asyncio
+    from datetime import UTC, datetime
+
+    async def producer():
+        # Publish one progress event, then the terminal event that ends the stream.
+        await asyncio.sleep(0.1)
+        await bus.publish(
+            AgentEventEnvelope(
+                job_id=int(sample_background_job.job_id),
+                event_type="agent.progress",
+                payload={"step": 1, "total": 3, "message": "halfway"},
+                emitted_at=datetime.now(UTC),
+            )
+        )
+        await asyncio.sleep(0.05)
+        await bus.publish(
+            AgentEventEnvelope(
+                job_id=int(sample_background_job.job_id),
+                event_type="job.succeeded",
+                payload={"status": "succeeded"},
+                emitted_at=datetime.now(UTC),
+            )
+        )
+
+    client = TestClient(app)
+    # TestClient cannot run an async producer concurrently, so use a thread.
+    # NOTE(review): the producer runs on its own event loop (asyncio.run) in a
+    # second thread. Confirm InMemoryAgentEventBus.publish is safe to call from
+    # a different loop/thread than the subscriber, and that the 0.1 s delay is
+    # long enough for the subscription to be open.
+    import threading
+
+    def run_producer() -> None:
+        asyncio.run(producer())
+
+    t = threading.Thread(target=run_producer)
+    t.start()
+    with client.stream("GET", f"/agent/jobs/{sample_background_job.job_id}/events") as resp:
+        lines = []
+        for chunk in resp.iter_lines():
+            if chunk:
+                lines.append(chunk)
+            # Stop reading as soon as the terminal event has been seen.
+            if any("job.succeeded" in line for line in lines):
+                break
+    t.join()
+
+    assert any("agent.progress" in line for line in lines)
+    assert any("job.succeeded" in line for line in lines)
+```
+
+> 注：原有依赖 0.6s DB 轮询的 SSE 测试如失败，按新模型重写为"测 initial replay + 测订阅流"两段。
+
+- [ ] **Step 3: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_routes.py -v -k "sse"`
+Expected: PASS
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add app/src/fileflash/routers/agent.py app/tests/test_agent_routes.py
+git commit -m "feat(agent): replace SSE polling with EventBus subscription"
+```
+
+---
+
+## Task 12: 删除 `POST /agent/cancel/{job_id}`
+
+**Files:**
+
+- Modify: `app/src/fileflash/routers/agent.py`
+- Modify: `app/tests/test_agent_routes.py`
+
+- [ ] **Step 1: 删除 `cancel_agent_job` 函数与对应的 `from ..schemas.agent import ... CancelAgentResponse` 引用**
+
+确认 import 调整后无 unused。
+
+- [ ] **Step 2: 删除 `test_agent_routes.py` 中所有 `POST /agent/cancel` 测试用例**
+
+Run: `grep -n "cancel_agent\|/agent/cancel" app/tests/test_agent_routes.py`
+逐条删除。
+
+- [ ] **Step 3: 全仓搜索其他引用并清理**
+
+Run: `grep -rn "agent/cancel\|cancelAgentJob" app/ web/`
+Expected: 仅 `web/` 下有引用（前端 plan 处理），后端无引用。如果后端有，一并删除。
+
+- [ ] **Step 4: 运行全部 agent 测试**
+
+Run: `cd app && uv run pytest tests/test_agent_routes.py -v`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add app/src/fileflash/routers/agent.py app/tests/test_agent_routes.py
+git commit -m "refactor(agent): drop legacy POST /agent/cancel route"
+```
+
+---
+
+## Task 13: `ExecuteRunner` 接入 inbox（pause/resume/skip/approve/cancel）
+
+**Files:**
+
+- Modify: `app/src/fileflash/agents/runtime/execute_runner.py`
+- Modify: `app/tests/test_agent_plan_execute_runtime.py`
+
+- [ ] **Step 1: 在 `ExecuteRunner.__init__` 增加 EventBus 依赖与状态**
+
+```python
+class ExecuteRunner:
+    def __init__(
+        self,
+        *,
+        policy_guard: PolicyGuard | None = None,
+        event_bus: AgentEventBus | None = None,
+    ) -> None:
+        """Store the policy guard and the optional event bus.
+
+        ``policy_guard`` falls back to a fresh ``PolicyGuard()`` when omitted.
+        ``event_bus`` may stay ``None``.
+        """
+        self.policy_guard = policy_guard or PolicyGuard()
+        self.event_bus = event_bus
+```
+
+> 默认 `None` 时退化为静默（不 publish），用于单元测试与旧调用兼容。
+
+- [ ] **Step 2: 在 `ExecuteRunner.run` 顶部新增 step 边界控制处理**
+
+把原 line 62-66 的循环顶部替换为：
+
+```python
+        from ...repositories import AgentInboxMessageRepository
+
+        inbox_repo = AgentInboxMessageRepository(db)
+        paused = False
+
+        for action in actions:
+            await db.refresh(job)
+            if job.cancel_requested_at is not None:
+                raise AgentJobCanceled()
+
+            # ---- step 边界 inbox 处理 ----
+            while True:
+                pending = await inbox_repo.list_pending_controls(job_id=int(job.job_id))
+                for ctrl in pending:
+                    if ctrl.kind == AgentInboxKind.CONTROL_CANCEL:
+                        await inbox_repo.mark_dropped(inbox_message_id=int(ctrl.inbox_message_id))
+                        job.cancel_requested_at = datetime.now(UTC)
+                        await db.commit()
+                        raise AgentJobCanceled()
+                    if ctrl.kind == AgentInboxKind.CONTROL_PAUSE:
+                        paused = True
+                        await inbox_repo.mark_dropped(inbox_message_id=int(ctrl.inbox_message_id))
+                        await self._publish_state("agent.paused", job_id=int(job.job_id))
+                    elif ctrl.kind == AgentInboxKind.CONTROL_RESUME:
+                        paused = False
+                        await inbox_repo.mark_dropped(inbox_message_id=int(ctrl.inbox_message_id))
+                        await self._publish_state("agent.resumed", job_id=int(job.job_id))
+                    elif ctrl.kind == AgentInboxKind.CONTROL_SKIP:
+                        # 标记跳过当前 step；继续外层 for
+                        await inbox_repo.mark_dropped(inbox_message_id=int(ctrl.inbox_message_id))
+                        warnings.append(f"Step {action.step} skipped by user")
+                        applied -= 0  # 不计入 applied
+                        await db.commit()
+                        break  # break inner pending loop
+                    else:
+                        # approve / deny — 单工具实时审批，由 policy_guard 读取，这里仅消费
+                        await inbox_repo.mark_dropped(inbox_message_id=int(ctrl.inbox_message_id))
+                await db.commit()
+                if not paused:
+                    break
+                # paused: 等 100ms 再轮询
+                await asyncio.sleep(0.1)
+            # ---- 结束 inbox 处理 ----
+```
+
+并在顶部 import 处新增：
+
+```python
+import asyncio
+
+from ...models.enums import AgentInboxKind
+from ..harness.event_bus import AgentEventBus, AgentEventEnvelope
+```
+
+新增 `_publish_state` 实例方法（与 `run` 同一类）：
+
+```python
+    async def _publish_state(self, event_type: str, *, job_id: int) -> None:
+        if self.event_bus is None:
+            return
+        await self.event_bus.publish(
+            AgentEventEnvelope(
+                job_id=job_id,
+                event_type=event_type,
+                payload={},
+                emitted_at=datetime.now(UTC),
+            )
+        )
+```
+
+- [ ] **Step 3: 把工具调用的事件 publish 也接上 EventBus**
+
+在 line 103-110（`append_step` running 之后）、line 130-140（`finish_step` succeeded 之后）、以及 failure 分支，分别插入：
+
+```python
+            # Tool started
+            if self.event_bus is not None:
+                await self.event_bus.publish(
+                    AgentEventEnvelope(
+                        job_id=int(job.job_id),
+                        event_type="tool.started",
+                        payload={
+                            "step": int(action.step),
+                            "tool": str(action.tool),
+                            "input": resolved_input,
+                        },
+                        emitted_at=started,
+                    )
+                )
+
+            # Tool succeeded
+            if self.event_bus is not None:
+                await self.event_bus.publish(
+                    AgentEventEnvelope(
+                        job_id=int(job.job_id),
+                        event_type="tool.succeeded",
+                        payload={
+                            "step": int(action.step),
+                            "tool": str(action.tool),
+                            "output": safe_output,
+                            "durationMs": duration_ms,
+                        },
+                        emitted_at=datetime.now(UTC),
+                    )
+                )
+
+            # Tool failed (covers both the resolve and the dispatch branches)
+            if self.event_bus is not None:
+                await self.event_bus.publish(
+                    AgentEventEnvelope(
+                        job_id=int(job.job_id),
+                        event_type="tool.failed",
+                        payload={
+                            "step": int(action.step),
+                            "tool": str(action.tool),
+                            # The error text is truncated to 2000 characters.
+                            "errorMessage": f"{type(exc).__name__}: {exc}"[:2000],
+                        },
+                        emitted_at=datetime.now(UTC),
+                    )
+                )
+```
+
+- [ ] **Step 4: 写 / 改测试，覆盖 pause-resume、cancel-via-inbox**
+
+在 `test_agent_plan_execute_runtime.py` 末尾追加：
+
+```python
+import asyncio
+
+from fileflash.agents.harness.event_bus import InMemoryAgentEventBus
+from fileflash.agents.harness.inbox import AgentInbox
+from fileflash.agents.runtime.execute_runner import AgentJobCanceled, ExecuteRunner
+from fileflash.models.enums import AgentInboxKind
+
+
+@pytest.mark.asyncio
+async def test_execute_runner_pauses_then_resumes(
+    db_session, executable_job_with_two_steps,  # noqa: ANN001
+):
+    """A pause followed by a resume still lets both steps be applied."""
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=db_session, event_bus=bus)
+    runner = ExecuteRunner(event_bus=bus)
+
+    async def control_later():
+        # Send pause shortly after the run starts, then resume 200 ms later.
+        # NOTE(review): this task and the runner share one db_session
+        # concurrently; confirm the fixture's session tolerates that.
+        await asyncio.sleep(0.05)
+        await inbox.handle(
+            job_id=int(executable_job_with_two_steps.job_id),
+            kind=AgentInboxKind.CONTROL_PAUSE,
+            payload={},
+        )
+        await db_session.commit()
+        await asyncio.sleep(0.2)
+        await inbox.handle(
+            job_id=int(executable_job_with_two_steps.job_id),
+            kind=AgentInboxKind.CONTROL_RESUME,
+            payload={},
+        )
+        await db_session.commit()
+
+    sender = asyncio.create_task(control_later())
+    result = await runner.run(db=db_session, job=executable_job_with_two_steps)
+    await sender
+
+    assert result.applied_actions == 2
+
+
+@pytest.mark.asyncio
+async def test_execute_runner_canceled_via_inbox(
+    db_session, executable_job_with_two_steps,  # noqa: ANN001
+):
+    """A ``control.cancel`` inbox message makes the run raise ``AgentJobCanceled``."""
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=db_session, event_bus=bus)
+    runner = ExecuteRunner(event_bus=bus)
+
+    async def cancel_later():
+        # Send the cancel control shortly after the run has started.
+        await asyncio.sleep(0.05)
+        await inbox.handle(
+            job_id=int(executable_job_with_two_steps.job_id),
+            kind=AgentInboxKind.CONTROL_CANCEL,
+            payload={},
+        )
+        await db_session.commit()
+
+    sender = asyncio.create_task(cancel_later())
+    with pytest.raises(AgentJobCanceled):
+        await runner.run(db=db_session, job=executable_job_with_two_steps)
+    await sender
+```
+
+> 注：`executable_job_with_two_steps` 是新 fixture。如项目已有可执行 job 的 fixture（参见 test_agent_plan_execute_runtime.py），沿用即可，否则在 `conftest.py` 加一个简单 fixture 构造含两步 read-only 计划的 job。
+
+- [ ] **Step 5: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_plan_execute_runtime.py -v -k "pause or canceled_via_inbox"`
+Expected: PASS
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add app/src/fileflash/agents/runtime/execute_runner.py app/tests/test_agent_plan_execute_runtime.py
+git commit -m "feat(agent): wire ExecuteRunner to inbox controls and event bus"
+```
+
+---
+
+## Task 14: `PlanRunner` 接入 ask（基础占位 + 接口暴露）
+
+**Files:**
+
+- Modify: `app/src/fileflash/agents/runtime/plan_runner.py`
+- Modify: `app/tests/test_agent_plan_execute_runtime.py`
+
+> 本 Task 不引入 LLM 触发 ask 的判断逻辑（那需要改 prompt 与 tool-use 模板，留给后续）。本 Task 仅把 `AskProtocol` 注入到 `PlanRunner` 与 `ExecuteRunner`，并提供 `await self._ask(...)` 辅助方法，供后续 prompt 模板调用。
+
+- [ ] **Step 1: 在 `PlanRunner.__init__` 增加 EventBus + ask 启停**
+
+```python
+class PlanRunner:
+    def __init__(
+        self,
+        *,
+        settings: Settings | None = None,
+        planner_client: PlannerClient | None = None,
+        event_bus: AgentEventBus | None = None,
+    ) -> None:
+        """Store the settings, planner client and optional event bus.
+
+        ``settings`` falls back to ``get_settings()``. ``planner_client`` falls
+        back to an ``AnthropicPlannerClient`` built from those settings.
+        ``event_bus`` may stay ``None``.
+        """
+        self.settings = settings or get_settings()
+        self.planner_client = planner_client or AnthropicPlannerClient(settings=self.settings)
+        self.event_bus = event_bus
+```
+
+在 import 处新增：
+
+```python
+from ..harness.event_bus import AgentEventBus
+from ..harness.ask import AskProtocol
+```
+
+在 `run` 方法的开头：
+
+```python
+        # Start an AskProtocol only when an event bus was injected.
+        ask: AskProtocol | None = None
+        if self.event_bus is not None:
+            ask = AskProtocol(db=db, event_bus=self.event_bus, job_id=int(job.job_id))
+            await ask.start()
+        try:
+            # ... existing run logic ...
+            return result
+        finally:
+            # Always release the subscription, whether the run succeeded or raised.
+            if ask is not None:
+                await ask.aclose()
+```
+
+在类中新增辅助：
+
+```python
+    async def _ask(
+        self,
+        *,
+        ask: AskProtocol | None,
+        prompt: str,
+        schema: dict[str, Any],
+    ) -> Any | None:
+        if ask is None:
+            return None
+        return await ask.ask(
+            prompt=prompt,
+            schema=schema,
+            timeout_sec=float(self.settings.agent_inbox_ask_timeout_sec),
+        )
+```
+
+> 后续 prompt 模板里若决定需要澄清，调 `await self._ask(ask=ask, prompt=..., schema=...)`。本 plan 仅做接线；触发逻辑留到后续。
+
+- [ ] **Step 2: ExecuteRunner 同样增加 ask 接线（已 publish 事件，但当前不主动调 ask）**
+
+只是为了对称，方便后续 prompt 模板复用。先在 `execute_runner.py` 的 import 处新增 `from ..harness.ask import AskProtocol`，再改 `ExecuteRunner.run` 顶部：
+
+```python
+        # Start an AskProtocol only when an event bus was injected.
+        ask: AskProtocol | None = None
+        if self.event_bus is not None:
+            ask = AskProtocol(db=db, event_bus=self.event_bus, job_id=int(job.job_id))
+            await ask.start()
+        try:
+            # ... existing run logic ...
+            return result
+        finally:
+            # Always release the subscription, whether the run succeeded or raised.
+            if ask is not None:
+                await ask.aclose()
+```
+
+> 当前 ExecuteRunner 不调用 `ask.ask()`；这只是接线。
+
+- [ ] **Step 3: 跳过端到端 ask 触发用例**
+
+> 触发 LLM 调 ask 取决于后续 prompt 模板的改动，超出本 plan 范围。`AskProtocol` 自身的行为（成功回答 + 超时 + status 写回）已在 Task 9 的两个用例完整覆盖。本 Task 不再写额外测试。
+
+- [ ] **Step 4: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_plan_execute_runtime.py -v`
+Expected: 既有用例 PASS（接线为可选注入，不破坏旧调用方）
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add app/src/fileflash/agents/runtime/plan_runner.py app/src/fileflash/agents/runtime/execute_runner.py app/tests/test_agent_plan_execute_runtime.py
+git commit -m "feat(agent): wire AskProtocol into PlanRunner and ExecuteRunner"
+```
+
+---
+
+## Task 15: worker 装配 EventBus 与 runner 注入
+
+**Files:**
+
+- Modify: `app/src/fileflash/agents/worker.py`
+
+- [ ] **Step 1: 在 `AgentWorkerConsumer.__init__` 中创建 EventBus 单例并下发**
+
+```python
+class AgentWorkerConsumer:
+    def __init__(
+        self,
+        *,
+        queue: RedisStreamJobQueue,
+        session_factory: async_sessionmaker[AsyncSession] = SessionLocal,
+        event_bus: AgentEventBus | None = None,
+    ) -> None:
+        """Store the queue, session factory and event bus used by the worker.
+
+        When ``event_bus`` is omitted, one is built with
+        ``build_agent_event_bus`` from the loaded settings.
+        """
+        self._settings = get_settings()
+        self._queue = queue
+        self._session_factory = session_factory
+        self._event_bus = event_bus or build_agent_event_bus(settings=self._settings)
+```
+
+在 imports 处新增：
+
+```python
+from ..agents.harness.event_bus import AgentEventBus, build_agent_event_bus
+```
+
+- [ ] **Step 2: 在 `_run_job` / `_process_message` 中创建 runner 时传入 event_bus**
+
+找到现有 `PlanRunner()` / `ExecuteRunner(...)` 实例化点（在 `_run_job` 内），替换为：
+
+```python
+            # Both runner kinds receive the worker's event bus.
+            if message.task_type == "agent.plan":
+                runner = PlanRunner(event_bus=self._event_bus)
+                result = await runner.run(db=db, job=fresh_job)
+                ...
+            elif message.task_type == "agent.execute":
+                runner = ExecuteRunner(event_bus=self._event_bus)
+                result = await runner.run(db=db, job=fresh_job)
+                ...
+```
+
+> 注：以现有代码的实例化位置为准；保持依赖注入路径一致。
+
+- [ ] **Step 3: 在 `_mark_canceled` / `_mark_failed` / `_mark_succeeded` 中也 publish 终态事件**
+
+```python
+    async def _publish_terminal(
+        self,
+        *,
+        job_id: int,
+        event_type: str,
+        payload: dict[str, Any] | None = None,
+    ) -> None:
+        await self._event_bus.publish(
+            AgentEventEnvelope(
+                job_id=job_id,
+                event_type=event_type,
+                payload=payload or {},
+                emitted_at=datetime.now(UTC),
+            )
+        )
+```
+
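+并在三个 mark 函数末尾分别 `await self._publish_terminal(...)`，事件类型对应 `job.canceled` / `job.failed` / `job.succeeded`。注意 `_publish_terminal` 还用到了 `AgentEventEnvelope`、`datetime` / `UTC` 和 `Any`：如果 `worker.py` 尚未导入，需要把 Step 1 的导入扩展为 `from ..agents.harness.event_bus import AgentEventBus, AgentEventEnvelope, build_agent_event_bus`，并补上 `from datetime import UTC, datetime` 与 `from typing import Any`。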
+
+- [ ] **Step 4: 加最小验证测试**
+
+`app/tests/test_agent_worker.py` 已存在；在末尾追加：
+
+```python
+@pytest.mark.asyncio
+async def test_worker_publishes_terminal_event(...):  # reuse the existing fixtures from test_agent_worker.py
+    ...
+    # Inject an InMemoryAgentEventBus, run a succeeding flow, and assert that a job.succeeded envelope is received.
+```
+
+> 注：如 test_agent_worker.py 现有结构难以注入 event_bus，跳过此 step，依赖 Task 16 的端到端验证。
+
+- [ ] **Step 5: 运行测试**
+
+Run: `cd app && uv run pytest tests/test_agent_worker.py -v`
+Expected: PASS
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add app/src/fileflash/agents/worker.py app/tests/test_agent_worker.py
+git commit -m "feat(agent): inject EventBus into worker and publish terminal events"
+```
+
+---
+
+## Task 16: 端到端集成测试（POST 消息 → worker 收到 → publish → SSE 收到）
+
+**Files:**
+
+- Create: `app/tests/test_agent_a_end_to_end.py`
+
+- [ ] **Step 1: 写端到端测试**
+
+```python
+# app/tests/test_agent_a_end_to_end.py
+from __future__ import annotations
+
+import asyncio
+from datetime import UTC, datetime
+
+import pytest
+
+from fileflash.agents.harness.event_bus import (
+    AgentEventEnvelope,
+    InMemoryAgentEventBus,
+)
+from fileflash.agents.harness.inbox import AgentInbox
+from fileflash.agents.runtime.execute_runner import (
+    AgentJobCanceled,
+    ExecuteRunner,
+)
+from fileflash.models.enums import AgentInboxKind
+
+
+@pytest.mark.asyncio
+async def test_user_pause_then_cancel_via_inbox(
+    db_session, executable_job_with_two_steps,  # noqa: ANN001
+):
+    bus = InMemoryAgentEventBus()
+    inbox = AgentInbox(db=db_session, event_bus=bus)
+    runner = ExecuteRunner(event_bus=bus)
+
+    seen_events: list[str] = []
+
+    async def consumer():
+        async with bus.subscribe(job_id=int(executable_job_with_two_steps.job_id)) as stream:
+            for _ in range(8):
+                try:
+                    env = await stream.next(timeout=2.0)
+                except TimeoutError:
+                    break
+                seen_events.append(env.event_type)
+                if env.event_type == "agent.paused":
+                    await inbox.handle(
+                        job_id=int(executable_job_with_two_steps.job_id),
+                        kind=AgentInboxKind.CONTROL_CANCEL,
+                        payload={},
+                    )
+                    await db_session.commit()
+
+    listener = asyncio.create_task(consumer())
+
+    async def pause_soon():
+        await asyncio.sleep(0.05)
+        await inbox.handle(
+            job_id=int(executable_job_with_two_steps.job_id),
+            kind=AgentInboxKind.CONTROL_PAUSE,
+            payload={},
+        )
+        await db_session.commit()
+
+    nudger = asyncio.create_task(pause_soon())
+
+    with pytest.raises(AgentJobCanceled):
+        await runner.run(db=db_session, job=executable_job_with_two_steps)
+
+    await nudger
+    listener.cancel()
+    with pytest.raises(asyncio.CancelledError):
+        await listener
+
+    assert "agent.paused" in seen_events
+    assert "tool.started" in seen_events or "tool.failed" in seen_events
+```
+
+- [ ] **Step 2: 运行**
+
+Run: `cd app && uv run pytest tests/test_agent_a_end_to_end.py -v`
+Expected: PASS
+
+- [ ] **Step 3: 全部 agent 测试 smoke**
+
+Run: `cd app && uv run pytest tests/ -k "agent" -v`
+Expected: 全部 PASS（含旧的 test_agent_routes.py / test_agent_repositories.py / test_agent_plan_execute_runtime.py）
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add app/tests/test_agent_a_end_to_end.py
+git commit -m "test(agent): end-to-end pause + cancel via inbox"
+```
+
+---
+
+## Acceptance Checklist（实施完成判定）
+
+- [ ] `app/src/fileflash/agents/harness/event_bus.py` 提供 `InMemoryAgentEventBus` 与 `RedisAgentEventBus`，并通过 `build_agent_event_bus` 工厂自动选择
+- [ ] `AgentInboxMessage` 表通过 V14 Flyway 迁移创建，ORM model + repository 已接入
+- [ ] `POST /agent/jobs/{job_id}/messages` 接受 7 种 kind（reply + 6 种 control）
+- [ ] `POST /agent/cancel/{job_id}` 已删除；取消统一走 inbox `control.cancel`
+- [ ] SSE 端点不再轮询 DB；初始 replay 后纯订阅 EventBus，包含 30s 心跳
+- [ ] `ExecuteRunner` 在 step 边界处理 pause/resume/skip/approve/deny/cancel
+- [ ] `PlanRunner` 与 `ExecuteRunner` 都启动了 `AskProtocol`；后续 prompt 模板可调 `_ask`
+- [ ] `worker.py` 注入 EventBus 并 publish `job.succeeded` / `job.failed` / `job.canceled` 终态
+- [ ] 端到端集成测试覆盖 pause → cancel via inbox 全链路
+
+**注意（不在本 plan 范围）：**
+
+- 前端接入新事件类型与上行通道 — 留给 `2026-05-26-agent-A-interaction-frontend.md`
+- prompt 模板里何时调 `ask` — 留给后续；本 plan 只提供接口
+- worker 多副本下"等用户回答的 worker 被杀"恢复机制 — 仅靠 `agent_inbox_ask_timeout_sec` 兜底；进一步的 owner 恢复留给后续 plan
diff --git a/docs/superpowers/plans/2026-05-26-agent-A-interaction-frontend.md b/docs/superpowers/plans/2026-05-26-agent-A-interaction-frontend.md
new file mode 100644
index 0000000..49fa467
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-26-agent-A-interaction-frontend.md
@@ -0,0 +1,1579 @@
+# Agent 子项目 A（交互/反馈层）— 前端实现计划
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** 把前端从"单向 SSE + 整个 job 取消"升级为"双向交互 + step 级 pause/resume/skip/approve + agent 中途提问 + 实时进度/思考/工具增量输出"，匹配 A-backend 已落地的事件类型与 `POST /agent/jobs/{id}/messages` 上行通道。
+
+**Architecture:** 在 `types/agent.d.ts` 扩展事件字面量与上行消息类型；`api/agent.ts` 用 `sendAgentMessage` + `sendAgentReply` + 6 个 control helper 取代 `cancelAgentJob`；`useAgentSession.ts` 引入 `waiting_for_user`/`paused` 状态、ask 缓存、`pauseTurn/resumeTurn/replyToAsk/...` 方法，cancel 改走 `control.cancel`；新增 `AskPrompt.vue` + `ControlBar.vue` 两个原子组件，TurnEntry 内嵌；TaskInputDock 在 `waiting_for_user` / `paused` 状态下禁用主输入框。
+
+**Tech Stack:** Vue 3 + TypeScript + Vitest + bun（**不用 npm**）+ 既有 i18n 体系 + 既有 atomic 设计语言（Industrial Dashboard，参见 `frontend_aesthetic.md`）。
+
+**Spec:** `docs/superpowers/specs/2026-05-26-agent-improvements-design.md` 子项目 A 部分（前端章节 A.7、A.8、A.10）
+
+**前置条件:** A-backend plan 已落地（commit 包含 `AgentInboxMessage` 模型、`POST /agent/jobs/{id}/messages`、SSE event_bus 推送、新 14 种 `AgentJobEventType`）
+
+---
+
+## File Structure
+
+**新建**
+
+- `web/src/components/organisms/agent/AskPrompt.vue` — 渲染单条 agent.ask 的输入气泡（选择型 / 自由文本，含 timeout 倒计时）
+- `web/src/components/organisms/agent/ControlBar.vue` — 渲染单 turn 的 pause/resume/skip/cancel 按钮组
+- `web/src/composables/useAskTimeout.ts` — ask 倒计时小工具（含 i18n 友好的 mm:ss 格式化）
+
+**修改**
+
+- `web/src/types/agent.d.ts` — 扩展 `AgentJobEventType`；删除 `CancelAgentResponse`；新增 `AgentInboxMessageKind` / `AgentInboxMessageRequest` / `AgentInboxMessageResponse`、`AgentAskPayload` / `AgentProgressPayload` / `AgentThinkingPayload` / `AgentToolPartialPayload`（`MsgStatus` 的扩展不在此文件，而在下面的 `useAgentSession.ts` 中完成）
+- `web/src/api/agent.ts` — 删除 `cancelAgentJob`；新增 `sendAgentMessage` 与 7 个 helper：1 个 reply helper `sendAgentReply`，以及 6 个 control helper `pauseAgentJob` / `resumeAgentJob` / `approveAgentStep` / `denyAgentStep` / `skipAgentStep` / `cancelAgentTurn`
+- `web/src/composables/useAgentSession.ts` — `MsgStatus` 加 `waiting_for_user` / `paused`；`ChatMessage` 加 `pendingAsk`、`pauseRequestedAt`、`progress`、`thinking`、`partials`；`applyAgentEvent` 覆盖新 6 种事件；`cancel(msg)` 改走 `control.cancel`；新增方法
+- `web/src/composables/useAgentSession.spec.ts` — 覆盖新事件与新方法
+- `web/src/components/organisms/agent/TurnEntry.vue` — 内嵌 `AskPrompt` / `ControlBar`；新增 progress 条与 thinking 折叠区；扩展 `activityEvents` 过滤规则
+- `web/src/components/organisms/agent/TaskInputDock.vue` — `disabled` prop 范围扩大（waiting_for_user / paused 时锁主输入）
+- `web/src/i18n/messages.ts` — 13 条新 key（ask/progress/thinking/控制按钮/状态文案）+ 中英文翻译
+
+**测试**
+
+- `web/src/composables/useAgentSession.spec.ts` — 既有文件追加
+- (可选) `web/src/components/organisms/agent/AskPrompt.spec.ts` — 新（@vue/test-utils 风格如项目已用，否则跳过）
+
+---
+
+## Sequencing
+
+```
+Task 1 (types) ──► Task 2 (api helpers) ──► Task 3 (i18n keys)
+                                                │
+                          ┌─────────────────────┴──────────────────────┐
+                          ▼                                            ▼
+        Task 4 (useAgentSession state + cancel rewire)     Task 5 (useAskTimeout)
+                          │                                            │
+                          ▼                                            │
+        Task 6 (useAgentSession ask handlers + control methods)        │
+                          │                                            │
+                          ▼                                            ▼
+                          ▼─────────────► Task 7 (AskPrompt.vue) ◄─────┘
+                          │
+                          ▼
+                  Task 8 (ControlBar.vue)
+                          │
+                          ▼
+                  Task 9 (TurnEntry.vue 集成)
+                          │
+                          ▼
+                  Task 10 (TaskInputDock.vue 锁定)
+                          │
+                          ▼
+                  Task 11 (端到端 spec：ask → reply → resume → cancel)
+                          │
+                          ▼
+                  Task 12 (手测脚本 + dev server 真跑一次)
+```
+
+---
+
+## Task 1: 扩展 types/agent.d.ts
+
+**Files:**
+
+- Modify: `web/src/types/agent.d.ts`
+
+- [ ] **Step 1: 扩展 `AgentJobEventType` 字面量与新增上行消息 / 事件 payload 类型**
+
+把 `AgentJobEventType` 替换为：
+
+```ts
+export type AgentJobEventType =
+  | 'job.queued'
+  | 'job.running'
+  | 'plan.ready'
+  | 'tool.started'
+  | 'tool.succeeded'
+  | 'tool.failed'
+  | 'tool.partial'
+  | 'agent.thinking'
+  | 'agent.progress'
+  | 'agent.ask'
+  | 'agent.paused'
+  | 'agent.resumed'
+  | 'job.succeeded'
+  | 'job.failed'
+  | 'job.canceled';
+```
+
+在文件末尾追加：
+
+```ts
+// ----------------- Inbox (upstream channel) -----------------
+
+export type AgentInboxMessageKind =
+  | 'reply'
+  | 'control.pause'
+  | 'control.resume'
+  | 'control.approve'
+  | 'control.deny'
+  | 'control.skip'
+  | 'control.cancel';
+
+export interface AgentInboxMessageRequest {
+  kind: AgentInboxMessageKind;
+  replyTo?: string;            // ask 的 inboxMessageId（string-encoded）
+  value?: unknown;             // reply 时为用户回答
+  metadata?: Record<string, unknown>;
+}
+
+export interface AgentInboxMessageResponse {
+  inboxMessageId: string;
+  kind: AgentInboxMessageKind;
+  acceptedAt: string;
+}
+
+// ----------------- New event payloads -----------------
+
+export interface AgentAskPayload {
+  messageId: string;
+  prompt: string;
+  schema: Record<string, unknown>;     // 自由形式；例如 {"choice":["A","B"]}
+  timeoutSec: number;
+}
+
+export interface AgentProgressPayload {
+  step: number;
+  total: number;
+  message?: string;
+  percent?: number;
+}
+
+export interface AgentThinkingPayload {
+  text: string;
+}
+
+export interface AgentToolPartialPayload {
+  step: number;
+  tool: string;
+  chunk: unknown;
+}
+```
+
+- [ ] **Step 2: 删除 `CancelAgentResponse` 接口**
+
+后端已删除 `POST /agent/cancel/{job_id}`；前端对应的 type 也一并清理。`web/src/api/agent.ts` 中的 import 在 Task 2 同步处理。
+
+- [ ] **Step 3: typecheck**
+
+Run: `cd web && bun run typecheck`
+Expected: 仅出现"`CancelAgentResponse` 仍被 import in api/agent.ts"的错误——Task 2 修复。
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add web/src/types/agent.d.ts
+git commit -m "feat(agent): extend frontend types for inbox + new event payloads"
+```
+
+---
+
+## Task 2: api/agent.ts 引入 sendAgentMessage + 7 个 helper（reply + 6 个 control）
+
+**Files:**
+
+- Modify: `web/src/api/agent.ts`
+
+- [ ] **Step 1: 删除 `cancelAgentJob` 与对应 import**
+
+```ts
+// 删除：
+import type { ... CancelAgentResponse ... } from '../types/agent';
+export const cancelAgentJob = (jobId: string) => { ... };
+```
+
+- [ ] **Step 2: 新增 `sendAgentMessage` 与 7 个 helper（`sendAgentReply` + 6 个 control helper）**
+
+在 `streamAgentJobEvents` 之上插入：
+
+```ts
+import type {
+  AgentBackgroundJob,
+  AgentInboxMessageRequest,
+  AgentInboxMessageResponse,
+  AgentJobEvent,
+  ExecuteAgentRequest,
+  ExecuteAgentResponse,
+  PlanAgentRequest,
+  PlanAgentResponse,
+} from '../types/agent';
+
+// ----------------- inbox upstream -----------------
+
+export const sendAgentMessage = (
+  jobId: string,
+  body: AgentInboxMessageRequest,
+) => {
+  return http.post<AgentInboxMessageResponse>(
+    `/agent/jobs/${encodeURIComponent(jobId)}/messages`,
+    body,
+  );
+};
+
+export const sendAgentReply = (
+  jobId: string,
+  replyTo: string,
+  value: unknown,
+) => sendAgentMessage(jobId, { kind: 'reply', replyTo, value });
+
+export const pauseAgentJob = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.pause' });
+
+export const resumeAgentJob = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.resume' });
+
+export const approveAgentStep = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.approve' });
+
+export const denyAgentStep = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.deny' });
+
+export const skipAgentStep = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.skip' });
+
+export const cancelAgentTurn = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.cancel' });
+```
+
+> 注：`cancelAgentTurn` 命名故意区别于历史的 `cancelAgentJob`，提示这是"通过 inbox 取消当前 turn"。所有引用 `cancelAgentJob` 的地方在 Task 4 改成 `cancelAgentTurn`。
+
+- [ ] **Step 3: 全仓搜索旧 import**
+
+Run: `grep -rn "cancelAgentJob\|CancelAgentResponse" web/src/`
+Expected: 仅 `web/src/composables/useAgentSession.ts` 几处需要 Task 4 处理。
+
+- [ ] **Step 4: typecheck**
+
+Run: `cd web && bun run typecheck`
+Expected: 仅剩 useAgentSession.ts 的 import 错误（Task 4 修）。
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add web/src/api/agent.ts
+git commit -m "feat(agent): add sendAgentMessage + 6 control helpers, drop cancelAgentJob"
+```
+
+---
+
+## Task 3: 新增 i18n key（中英文）
+
+**Files:**
+
+- Modify: `web/src/i18n/messages.ts`
+
+- [ ] **Step 1: 在 `LocaleKey` union（约 line 480-580）的 agent.v2 区块插入新 key**
+
+按字母序插在 `agent.v2.turn.cancel` 附近：
+
+```ts
+  | 'agent.v2.turn.status.waiting_for_user'
+  | 'agent.v2.turn.status.paused'
+  | 'agent.v2.turn.controls.pause'
+  | 'agent.v2.turn.controls.resume'
+  | 'agent.v2.turn.controls.skip'
+  | 'agent.v2.turn.controls.approve'
+  | 'agent.v2.turn.controls.deny'
+  | 'agent.v2.turn.ask.placeholder'
+  | 'agent.v2.turn.ask.send'
+  | 'agent.v2.turn.ask.timeout'
+  | 'agent.v2.turn.progress.label'
+  | 'agent.v2.turn.thinking.label'
+  | 'agent.v2.turn.thinking.toggle'
+```
+
+- [ ] **Step 2: 在 zh-CN 翻译 map 中添加（约 line 1066-1160）**
+
+```ts
+    'agent.v2.turn.status.waiting_for_user': '等待你回复',
+    'agent.v2.turn.status.paused': '已暂停',
+    'agent.v2.turn.controls.pause': '暂停',
+    'agent.v2.turn.controls.resume': '继续',
+    'agent.v2.turn.controls.skip': '跳过此步',
+    'agent.v2.turn.controls.approve': '批准',
+    'agent.v2.turn.controls.deny': '拒绝',
+    'agent.v2.turn.ask.placeholder': '输入回答…',
+    'agent.v2.turn.ask.send': '发送',
+    'agent.v2.turn.ask.timeout': '剩余 {value}',
+    'agent.v2.turn.progress.label': '进度',
+    'agent.v2.turn.thinking.label': '思考过程',
+    'agent.v2.turn.thinking.toggle': '展开 / 收起',
+```
+
+- [ ] **Step 3: 在 en 翻译 map 中添加（约 line 1641-1730）**
+
+```ts
+    'agent.v2.turn.status.waiting_for_user': 'WAITING FOR YOU',
+    'agent.v2.turn.status.paused': 'PAUSED',
+    'agent.v2.turn.controls.pause': 'Pause',
+    'agent.v2.turn.controls.resume': 'Resume',
+    'agent.v2.turn.controls.skip': 'Skip step',
+    'agent.v2.turn.controls.approve': 'Approve',
+    'agent.v2.turn.controls.deny': 'Deny',
+    'agent.v2.turn.ask.placeholder': 'Type your answer…',
+    'agent.v2.turn.ask.send': 'Send',
+    'agent.v2.turn.ask.timeout': '{value} left',
+    'agent.v2.turn.progress.label': 'PROGRESS',
+    'agent.v2.turn.thinking.label': 'THINKING',
+    'agent.v2.turn.thinking.toggle': 'Expand / Collapse',
+```
+
+- [ ] **Step 4: typecheck**
+
+Run: `cd web && bun run typecheck`
+Expected: PASS（LocaleKey union 与 map 一致）
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add web/src/i18n/messages.ts
+git commit -m "feat(agent): add i18n keys for ask/pause/progress/controls"
+```
+
+---
+
+## Task 4: useAgentSession.ts — 扩展状态 + 改 cancel 走 inbox
+
+**Files:**
+
+- Modify: `web/src/composables/useAgentSession.ts`
+
+- [ ] **Step 1: 扩展 `MsgStatus` 与 `ChatMessage`**
+
+把现有 `MsgStatus` 类型改为：
+
+```ts
+export type MsgStatus =
+  | 'pending'
+  | 'running'
+  | 'succeeded'
+  | 'failed'
+  | 'canceled'
+  | 'waiting_for_user'
+  | 'paused';
+```
+
+把 `ChatMessage` 接口扩展为：
+
+```ts
+export interface PendingAsk {
+  messageId: string;
+  prompt: string;
+  schema: Record<string, unknown>;
+  timeoutSec: number;
+  askedAt: string;
+}
+
+export interface ToolPartial {
+  step: number;
+  tool: string;
+  chunks: unknown[];
+}
+
+export interface ChatMessage {
+  id: string;
+  role: 'user' | 'agent';
+  content: string;
+  status: MsgStatus;
+  planJobId?: string;
+  planHash?: string;
+  planResult?: AgentPlanResult;
+  executeJobId?: string;
+  executeResult?: AgentExecutionResult;
+  events: AgentJobEvent[];
+  errorMessage?: string;
+  timestamp: string;
+  // —— 新增（A 前端）——
+  pendingAsk?: PendingAsk;
+  pauseRequestedAt?: string;
+  progress?: { step: number; total: number; message?: string; percent?: number };
+  thinking?: string;                     // 累积的 thinking 文本
+  partials?: Record<number, ToolPartial>;
+}
+```
+
+- [ ] **Step 2: 调整 `applyAgentEvent` 覆盖新事件**
+
+替换现有 `applyAgentEvent` 为：
+
+```ts
+const applyAgentEvent = (msg: ChatMessage, event: AgentJobEvent, kind: 'plan' | 'execute') => {
+  appendAgentEvent(msg, event);
+
+  // 终态 / 既有事件
+  if (event.type === 'job.queued') {
+    msg.status = 'pending';
+  } else if (event.type === 'job.running' || event.type === 'tool.started') {
+    if (msg.status !== 'waiting_for_user' && msg.status !== 'paused') {
+      msg.status = 'running';
+    }
+  } else if (event.type === 'job.failed' || event.type === 'tool.failed') {
+    msg.status = 'failed';
+    const errorMessage = event.data?.errorMessage;
+    msg.errorMessage = typeof errorMessage === 'string' ? errorMessage : event.message;
+  } else if (event.type === 'job.canceled') {
+    msg.status = 'canceled';
+  } else if (event.type === 'job.succeeded') {
+    msg.status = 'succeeded';
+    msg.pendingAsk = undefined;
+    msg.pauseRequestedAt = undefined;
+  }
+
+  // 新事件
+  if (event.type === 'agent.ask') {
+    const payload = event.data as AgentAskPayload;
+    msg.pendingAsk = {
+      messageId: payload.messageId,
+      prompt: payload.prompt,
+      schema: payload.schema,
+      timeoutSec: payload.timeoutSec,
+      askedAt: event.timestamp,
+    };
+    msg.status = 'waiting_for_user';
+  } else if (event.type === 'agent.paused') {
+    msg.status = 'paused';
+    msg.pauseRequestedAt = event.timestamp;
+  } else if (event.type === 'agent.resumed') {
+    msg.status = 'running';
+    msg.pauseRequestedAt = undefined;
+  } else if (event.type === 'agent.progress') {
+    const payload = event.data as AgentProgressPayload;
+    msg.progress = {
+      step: payload.step,
+      total: payload.total,
+      message: payload.message,
+      percent: payload.percent,
+    };
+  } else if (event.type === 'agent.thinking') {
+    const payload = event.data as AgentThinkingPayload;
+    msg.thinking = (msg.thinking || '') + (payload.text || '');
+  } else if (event.type === 'tool.partial') {
+    const payload = event.data as AgentToolPartialPayload;
+    msg.partials = msg.partials || {};
+    const slot = msg.partials[payload.step] || { step: payload.step, tool: payload.tool, chunks: [] };
+    slot.chunks = [...slot.chunks, payload.chunk];
+    msg.partials[payload.step] = slot;
+  }
+
+  const result = event.data?.result;
+  if (event.type === 'plan.ready' && result) {
+    msg.planResult = result as AgentPlanResult;
+    msg.planHash = msg.planResult.planHash;
+  }
+  if (event.type === 'job.succeeded' && result) {
+    if (kind === 'plan') {
+      msg.planResult = result as AgentPlanResult;
+      msg.planHash = msg.planResult.planHash;
+    } else {
+      msg.executeResult = result as AgentExecutionResult;
+    }
+  }
+};
+```
+
+在 imports 顶部追加：
+
+```ts
+import type {
+  AgentAskPayload,
+  AgentExecutionPolicy,
+  AgentExecutionResult,
+  AgentJobEvent,
+  AgentPlanResult,
+  AgentProgressPayload,
+  AgentReasoningEffort,
+  AgentThinkingPayload,
+  AgentToolPartialPayload,
+  PlanAgentRequest,
+} from '../types/agent';
+```
+
+- [ ] **Step 3: 把 `cancel(msg)` 改走 `control.cancel`**
+
+替换 `cancel` 函数 + 删除顶部 `cancelAgentJob` import：
+
+```ts
+import {
+  cancelAgentTurn,
+  executeAgentPlan,
+  getAgentJob,
+  planAgentTask,
+  streamAgentJobEvents,
+} from '../api/agent';
+
+// ...
+
+async function cancel(msg: ChatMessage): Promise<void> {
+  markTurnCanceled(msg);
+  msg.status = 'canceled';
+  msg.pendingAsk = undefined;
+  msg.pauseRequestedAt = undefined;
+  stopPolling(`${msg.id}:plan`);
+  stopPolling(`${msg.id}:execute`);
+  stopStream(`${msg.id}:plan`);
+  stopStream(`${msg.id}:execute`);
+  const jobId = msg.executeJobId || msg.planJobId;
+  if (!jobId) return;
+  try {
+    await cancelAgentTurn(jobId);
+  } catch (error) {
+    msg.errorMessage = extractErrorMessage(error, 'Cancel failed.');
+  }
+}
+```
+
+同时把 `sendMessage` / `runExecute` 内的旧 `cancelAgentJob(res.jobId)` 替换为 `cancelAgentTurn(res.jobId)`：
+
+```ts
+// sendMessage 内：
+if (isTurnCanceled(reactiveAgent) || reactiveAgent.status === 'canceled') {
+  try {
+    await cancelAgentTurn(res.jobId);
+  } catch { /* ignore */ }
+  return;
+}
+
+// runExecute 内：
+if (!ensureTurnNotCanceled(msg)) {
+  try {
+    await cancelAgentTurn(res.jobId);
+  } catch { /* ignore */ }
+  return;
+}
+```
+
+- [ ] **Step 4: 全仓 grep**
+
+Run: `grep -rn "cancelAgentJob" web/src/`
+Expected: 无匹配。
+
+- [ ] **Step 5: typecheck + 跑既有测试**
+
+Run: `cd web && bun run typecheck && bun run test useAgentSession`
+Expected: typecheck PASS；既有 spec 大多 PASS。如果某些用例断言"取消时调用 cancelAgentJob"，改断言为 `cancelAgentTurn`（即 `sendAgentMessage(..., {kind:'control.cancel'})`）。
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add web/src/composables/useAgentSession.ts
+git commit -m "feat(agent): extend session state for ask/pause/progress, rewire cancel via inbox"
+```
+
+---
+
+## Task 5: 新建 `useAskTimeout.ts`
+
+**Files:**
+
+- Create: `web/src/composables/useAskTimeout.ts`
+- Create: `web/src/composables/useAskTimeout.spec.ts`
+
+- [ ] **Step 1: 写测试**
+
+```ts
+// web/src/composables/useAskTimeout.spec.ts
+import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
+import { ref } from 'vue';
+import { useAskTimeout } from './useAskTimeout';
+
+describe('useAskTimeout', () => {
+  beforeEach(() => {
+    vi.useFakeTimers();
+  });
+  afterEach(() => {
+    vi.useRealTimers();
+  });
+
+  it('counts down from askedAt + timeoutSec', () => {
+    const askedAt = ref('2026-05-26T12:00:00.000Z');
+    const timeoutSec = ref(120);
+    vi.setSystemTime(new Date('2026-05-26T12:00:30.000Z'));
+    const { remainingSec, formatted, expired } = useAskTimeout(askedAt, timeoutSec);
+    expect(remainingSec.value).toBe(90);
+    expect(formatted.value).toBe('01:30');
+    expect(expired.value).toBe(false);
+
+    vi.setSystemTime(new Date('2026-05-26T12:02:01.000Z'));
+    vi.advanceTimersByTime(1000);
+    expect(expired.value).toBe(true);
+    expect(remainingSec.value).toBe(0);
+    expect(formatted.value).toBe('00:00');
+  });
+
+  it('returns expired immediately when askedAt is missing', () => {
+    const askedAt = ref<string | undefined>(undefined);
+    const timeoutSec = ref(60);
+    const { expired, formatted } = useAskTimeout(askedAt, timeoutSec);
+    expect(expired.value).toBe(true);
+    expect(formatted.value).toBe('00:00');
+  });
+});
+```
+
+- [ ] **Step 2: 运行测试，确认 fail**
+
+Run: `cd web && bun run test useAskTimeout`
+Expected: FAIL — module missing.
+
+- [ ] **Step 3: 实现**
+
+```ts
+// web/src/composables/useAskTimeout.ts
+import { computed, onScopeDispose, ref, watchEffect, type Ref } from 'vue';
+
+export function useAskTimeout(
+  askedAt: Ref<string | undefined | null>,
+  timeoutSec: Ref<number>,
+) {
+  const now = ref<number>(Date.now());
+  let timer: ReturnType<typeof setInterval> | null = null;
+
+  watchEffect(() => {
+    if (timer) clearInterval(timer);
+    if (!askedAt.value || timeoutSec.value <= 0) return;
+    timer = setInterval(() => {
+      now.value = Date.now();
+    }, 1000);
+  });
+
+  onScopeDispose(() => {
+    if (timer) clearInterval(timer);
+  });
+
+  const deadline = computed(() => {
+    if (!askedAt.value) return null;
+    const base = Date.parse(askedAt.value);
+    if (Number.isNaN(base)) return null;
+    return base + timeoutSec.value * 1000;
+  });
+
+  const remainingSec = computed(() => {
+    if (deadline.value === null) return 0;
+    return Math.max(0, Math.ceil((deadline.value - now.value) / 1000));
+  });
+
+  const expired = computed(() => deadline.value === null || remainingSec.value <= 0);
+
+  const formatted = computed(() => {
+    const total = remainingSec.value;
+    const mm = String(Math.floor(total / 60)).padStart(2, '0');
+    const ss = String(total % 60).padStart(2, '0');
+    return `${mm}:${ss}`;
+  });
+
+  return { remainingSec, formatted, expired };
+}
+```
+
+- [ ] **Step 4: 运行测试**
+
+Run: `cd web && bun run test useAskTimeout`
+Expected: PASS（2 个用例）
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add web/src/composables/useAskTimeout.ts web/src/composables/useAskTimeout.spec.ts
+git commit -m "feat(agent): add useAskTimeout countdown composable"
+```
+
+---
+
+## Task 6: useAgentSession.ts — ask reply 与控制方法
+
+**Files:**
+
+- Modify: `web/src/composables/useAgentSession.ts`
+- Modify: `web/src/composables/useAgentSession.spec.ts`
+
+- [ ] **Step 1: 更新 spec 顶部的 `vi.mock` 工厂，注册新 helper**
+
+`useAgentSession.spec.ts` 顶部已有：
+
+```ts
+vi.mock('../api/agent', () => ({
+  planAgentTask: vi.fn(),
+  executeAgentPlan: vi.fn(),
+  cancelAgentJob: vi.fn(),
+  getAgentJob: vi.fn(),
+  streamAgentJobEvents: vi.fn(),
+}));
+```
+
+替换为：
+
+```ts
+vi.mock('../api/agent', () => ({
+  planAgentTask: vi.fn(),
+  executeAgentPlan: vi.fn(),
+  cancelAgentTurn: vi.fn(),         // 替代旧 cancelAgentJob
+  getAgentJob: vi.fn(),
+  streamAgentJobEvents: vi.fn(),
+  sendAgentMessage: vi.fn(),
+  sendAgentReply: vi.fn(),
+  pauseAgentJob: vi.fn(),
+  resumeAgentJob: vi.fn(),
+  approveAgentStep: vi.fn(),
+  denyAgentStep: vi.fn(),
+  skipAgentStep: vi.fn(),
+}));
+```
+
+把既有用到 `agentApi.cancelAgentJob` 的断言全部改为 `agentApi.cancelAgentTurn`（Task 4 已经改了源；spec 这里同步）。
+
+Run: `grep -n "cancelAgentJob" web/src/composables/useAgentSession.spec.ts`
+Expected: 找到的每一处都要改成 `cancelAgentTurn`。
+
+- [ ] **Step 2: 在 spec 末尾追加 inbox-controls 用例**
+
+```ts
+import * as agentApi from '../api/agent';
+
+describe('useAgentSession — inbox controls', () => {
+  beforeEach(() => {
+    vi.mocked(agentApi.sendAgentReply).mockResolvedValue({
+      inboxMessageId: '42', kind: 'reply', acceptedAt: '2026-05-26T00:00:00Z',
+    });
+    vi.mocked(agentApi.pauseAgentJob).mockResolvedValue({
+      inboxMessageId: '50', kind: 'control.pause', acceptedAt: '2026-05-26T00:00:00Z',
+    });
+  });
+
+  it('replyToAsk sends reply to backend and clears pendingAsk', async () => {
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, replyToAsk } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-1',
+      role: 'agent',
+      content: '',
+      status: 'waiting_for_user',
+      events: [],
+      timestamp: new Date().toISOString(),
+      executeJobId: '77',
+      pendingAsk: {
+        messageId: '101',
+        prompt: 'choose',
+        schema: { choice: ['A', 'B'] },
+        timeoutSec: 60,
+        askedAt: new Date().toISOString(),
+      },
+    };
+    session.messages.push(msg);
+
+    await replyToAsk(msg, 'A');
+
+    expect(agentApi.sendAgentReply).toHaveBeenCalledWith('77', '101', 'A');
+    expect(msg.pendingAsk).toBeUndefined();
+    expect(msg.status).toBe('running');
+  });
+
+  it('pauseTurn sends control.pause and records pauseRequestedAt', async () => {
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, pauseTurn } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-2', role: 'agent', content: '', status: 'running',
+      events: [], timestamp: new Date().toISOString(), executeJobId: '88',
+    };
+    session.messages.push(msg);
+
+    await pauseTurn(msg);
+    expect(agentApi.pauseAgentJob).toHaveBeenCalledWith('88');
+    // 本地不立即翻 paused，等 agent.paused 事件
+    expect(msg.pauseRequestedAt).toBeTruthy();
+  });
+});
+```
+
+> 注：上述用例沿用项目既有的 `vi.mock + vi.mocked + loadComposable()` 风格（参见同文件其它用例），不引入 `vi.spyOn(await import(...))` 写法。`ChatMessage` 类型可能需要从同目录的 `'./useAgentSession'` 导入（跟随既有用例的引用方式）；若文件顶部已有 `import * as agentApi from '../api/agent'`，追加用例时不要重复该 import。
+
+- [ ] **Step 2b: 实现 6 个新方法**
+
+在 `useAgentSession.ts` 内（`cancel` 函数附近）新增：
+
+```ts
+import {
+  approveAgentStep,
+  cancelAgentTurn,
+  denyAgentStep,
+  executeAgentPlan,
+  getAgentJob,
+  pauseAgentJob,
+  planAgentTask,
+  resumeAgentJob,
+  sendAgentReply,
+  skipAgentStep,
+  streamAgentJobEvents,
+} from '../api/agent';
+
+// ...
+
+const activeJobId = (msg: ChatMessage): string | undefined =>
+  msg.executeJobId || msg.planJobId;
+
+async function replyToAsk(msg: ChatMessage, value: unknown): Promise<void> {
+  const jobId = activeJobId(msg);
+  const ask = msg.pendingAsk; // 先保存快照：下面会乐观清空 pendingAsk，失败时需原样恢复
+  if (!jobId || !ask) return;
+  msg.pendingAsk = undefined;
+  msg.status = 'running';
+  try {
+    await sendAgentReply(jobId, ask.messageId, value);
+  } catch (error) {
+    msg.status = 'waiting_for_user';
+    msg.pendingAsk = {
+      messageId: ask.messageId,
+      prompt: ask.prompt,
+      schema: ask.schema,
+      timeoutSec: ask.timeoutSec,
+      askedAt: ask.askedAt,
+    };
+    msg.errorMessage = extractErrorMessage(error, 'Reply failed.');
+  }
+}
+
+async function pauseTurn(msg: ChatMessage): Promise<void> {
+  const jobId = activeJobId(msg);
+  if (!jobId) return;
+  msg.pauseRequestedAt = new Date().toISOString();
+  try {
+    await pauseAgentJob(jobId);
+  } catch (error) {
+    msg.pauseRequestedAt = undefined;
+    msg.errorMessage = extractErrorMessage(error, 'Pause failed.');
+  }
+}
+
+async function resumeTurn(msg: ChatMessage): Promise<void> {
+  const jobId = activeJobId(msg);
+  if (!jobId) return;
+  try {
+    await resumeAgentJob(jobId);
+  } catch (error) {
+    msg.errorMessage = extractErrorMessage(error, 'Resume failed.');
+  }
+}
+
+async function approveStep(msg: ChatMessage): Promise<void> {
+  const jobId = activeJobId(msg);
+  if (!jobId) return;
+  try {
+    await approveAgentStep(jobId);
+  } catch (error) {
+    msg.errorMessage = extractErrorMessage(error, 'Approve failed.');
+  }
+}
+
+async function denyStep(msg: ChatMessage): Promise<void> {
+  const jobId = activeJobId(msg);
+  if (!jobId) return;
+  try {
+    await denyAgentStep(jobId);
+  } catch (error) {
+    msg.errorMessage = extractErrorMessage(error, 'Deny failed.');
+  }
+}
+
+async function skipStep(msg: ChatMessage): Promise<void> {
+  const jobId = activeJobId(msg);
+  if (!jobId) return;
+  try {
+    await skipAgentStep(jobId);
+  } catch (error) {
+    msg.errorMessage = extractErrorMessage(error, 'Skip failed.');
+  }
+}
+```
+
+把 6 个方法加到 return 对象末尾：
+
+```ts
+  return {
+    sessions: s.sessions,
+    activeSessionId: s.activeSessionId,
+    activeSession,
+    activeTurns,
+    policy: s.policy,
+    reasoningEffort: s.reasoningEffort,
+    taskInput: s.taskInput,
+    isSending: s.isSending,
+    createSession,
+    switchSession,
+    deleteSession,
+    resetActiveSession,
+    sendMessage,
+    runExecute,
+    cancel,
+    // —— 新增 ——
+    replyToAsk,
+    pauseTurn,
+    resumeTurn,
+    approveStep,
+    denyStep,
+    skipStep,
+  };
+```
+
+- [ ] **Step 3: 运行测试**
+
+Run: `cd web && bun run test useAgentSession`
+Expected: PASS（含新追加的两个用例）
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add web/src/composables/useAgentSession.ts web/src/composables/useAgentSession.spec.ts
+git commit -m "feat(agent): add replyToAsk + pause/resume/skip/approve/deny composables"
+```
+
+---
+
+## Task 7: `AskPrompt.vue`
+
+**Files:**
+
+- Create: `web/src/components/organisms/agent/AskPrompt.vue`
+
+- [ ] **Step 1: 实现组件**
+
+```vue
+<!-- web/src/components/organisms/agent/AskPrompt.vue -->
+<script setup lang="ts">
+import { computed, ref } from 'vue';
+import Button from '../../molecules/Button.vue';
+import { useLocaleStore } from '../../../store/locale';
+import { useAskTimeout } from '../../../composables/useAskTimeout';
+import type { PendingAsk } from '../../../composables/useAgentSession';
+
+const props = defineProps<{
+  ask: PendingAsk;
+  disabled?: boolean;
+}>();
+
+const emit = defineEmits<{ reply: [value: unknown] }>();
+
+const localeStore = useLocaleStore();
+const t = localeStore.t;
+
+const askedAt = computed(() => props.ask.askedAt);
+const timeoutSec = computed(() => props.ask.timeoutSec);
+const { formatted, expired } = useAskTimeout(askedAt, timeoutSec);
+
+const text = ref('');
+
+const choices = computed<string[]>(() => {
+  const c = props.ask.schema?.choice;
+  return Array.isArray(c) ? (c as unknown[]).map((v) => String(v)) : [];
+});
+
+const submit = () => {
+  if (props.disabled || expired.value) return;
+  if (text.value.trim()) {
+    emit('reply', text.value.trim());
+    text.value = '';
+  }
+};
+
+const onKey = (e: KeyboardEvent) => {
+  if (e.key === 'Enter' && !e.shiftKey) {
+    e.preventDefault();
+    submit();
+  }
+};
+</script>
+
+<template>
+  <section class="ff-askp" :class="{ 'is-expired': expired }">
+    <header class="ff-askp__head">
+      <span class="ff-askp__label">{{ t('agent.v2.turn.status.waiting_for_user') }}</span>
+      <span class="ff-askp__timer">{{ t('agent.v2.turn.ask.timeout', { value: formatted }) }}</span>
+    </header>
+    <p class="ff-askp__prompt">{{ ask.prompt }}</p>
+
+    <div v-if="choices.length" class="ff-askp__choices">
+      <Button
+        v-for="choice in choices"
+        :key="choice"
+        variant="secondary"
+        size="sm"
+        :disabled="disabled || expired"
+        @click="emit('reply', choice)"
+      >{{ choice }}</Button>
+    </div>
+
+    <div v-else class="ff-askp__free">
+      <textarea
+        class="ff-askp__ta"
+        :value="text"
+        :disabled="disabled || expired"
+        :placeholder="t('agent.v2.turn.ask.placeholder')"
+        rows="2"
+        @input="(e) => (text = (e.target as HTMLTextAreaElement).value)"
+        @keydown="onKey"
+      />
+      <Button
+        variant="primary"
+        size="sm"
+        :disabled="!text.trim() || disabled || expired"
+        @click="submit"
+      >{{ t('agent.v2.turn.ask.send') }}</Button>
+    </div>
+  </section>
+</template>
+
+<style scoped>
+.ff-askp {
+  display: flex; flex-direction: column; gap: var(--sp-sm);
+  padding: var(--sp-md);
+  border: 1px solid var(--ac);
+  background: var(--surface-base);
+}
+.ff-askp.is-expired { border-color: var(--text-tertiary); opacity: 0.6; }
+.ff-askp__head {
+  display: flex; justify-content: space-between; align-items: center;
+  font-family: var(--font-mono); font-size: var(--text-small);
+  letter-spacing: var(--tracking-wide); text-transform: uppercase;
+}
+.ff-askp__label { color: var(--ac); }
+.ff-askp__timer { color: var(--text-tertiary); }
+.ff-askp__prompt { margin: 0; color: var(--text-primary); white-space: pre-wrap; }
+.ff-askp__choices { display: flex; gap: var(--sp-sm); flex-wrap: wrap; }
+.ff-askp__free { display: flex; gap: var(--sp-sm); align-items: flex-end; }
+.ff-askp__ta {
+  flex: 1; resize: vertical; min-height: 48px;
+  padding: var(--sp-sm) var(--sp-md);
+  background: var(--surface-raised); color: var(--text-primary);
+  border: 1px solid var(--border-default); border-radius: 0;
+  font-family: var(--font-sans); font-size: var(--text-body); outline: none;
+}
+.ff-askp__ta:focus { border-color: var(--ac); }
+.ff-askp__ta:disabled { opacity: 0.6; cursor: not-allowed; }
+</style>
+```
+
+> 设计风格：沿用 Industrial Dashboard（参见 memory `frontend_aesthetic.md`）—— 直角硬边、`var(--ac)` 主色描边、等宽数字倒计时。
+
+- [ ] **Step 2: 确认 PendingAsk 已被 useAgentSession 导出**
+
+```ts
+// web/src/composables/useAgentSession.ts —— Task 4 已通过 `export interface PendingAsk` 导出该类型；
+// 仅当声明处缺少 export 时才补上。不要再追加 `export type { PendingAsk }`，否则会重复导出并报 TS2484。
+```
+
+Run: `grep -n "export type.*PendingAsk\|export interface PendingAsk" web/src/composables/useAgentSession.ts`
+Expected: 至少一行命中。
+
+- [ ] **Step 3: typecheck**
+
+Run: `cd web && bun run typecheck`
+Expected: PASS
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add web/src/components/organisms/agent/AskPrompt.vue web/src/composables/useAgentSession.ts
+git commit -m "feat(agent): AskPrompt component for inline ask UI"
+```
+
+---
+
+## Task 8: `ControlBar.vue`
+
+**Files:**
+
+- Create: `web/src/components/organisms/agent/ControlBar.vue`
+
+- [ ] **Step 1: 实现组件**
+
+```vue
+<!-- web/src/components/organisms/agent/ControlBar.vue -->
+<script setup lang="ts">
+import Button from '../../molecules/Button.vue';
+import { useLocaleStore } from '../../../store/locale';
+import type { MsgStatus } from '../../../composables/useAgentSession';
+
+defineProps<{
+  status: MsgStatus;
+  hasPlanRiskStep?: boolean;        // plan 中含 high-risk 步骤时显示 approve/deny
+}>();
+
+defineEmits<{
+  pause: [];
+  resume: [];
+  skip: [];
+  approve: [];
+  deny: [];
+  cancel: [];
+}>();
+
+const localeStore = useLocaleStore();
+const t = localeStore.t;
+</script>
+
+<template>
+  <div class="ff-ctrl">
+    <Button
+      v-if="status === 'running'"
+      variant="ghost"
+      size="sm"
+      @click.stop="$emit('pause')"
+    >{{ t('agent.v2.turn.controls.pause') }}</Button>
+
+    <Button
+      v-if="status === 'paused'"
+      variant="primary"
+      size="sm"
+      @click.stop="$emit('resume')"
+    >{{ t('agent.v2.turn.controls.resume') }}</Button>
+
+    <Button
+      v-if="status === 'running' || status === 'paused'"
+      variant="ghost"
+      size="sm"
+      @click.stop="$emit('skip')"
+    >{{ t('agent.v2.turn.controls.skip') }}</Button>
+
+    <template v-if="hasPlanRiskStep && status === 'running'">
+      <Button variant="primary" size="sm" @click.stop="$emit('approve')">
+        {{ t('agent.v2.turn.controls.approve') }}
+      </Button>
+      <Button variant="ghost" size="sm" @click.stop="$emit('deny')">
+        {{ t('agent.v2.turn.controls.deny') }}
+      </Button>
+    </template>
+
+    <Button
+      v-if="status === 'pending' || status === 'running' || status === 'paused' || status === 'waiting_for_user'"
+      variant="ghost"
+      size="sm"
+      @click.stop="$emit('cancel')"
+    >{{ t('agent.v2.turn.cancel') }}</Button>
+  </div>
+</template>
+
+<style scoped>
+.ff-ctrl { display: flex; gap: var(--sp-sm); justify-content: flex-end; flex-wrap: wrap; }
+</style>
+```
+
+- [ ] **Step 2: typecheck**
+
+Run: `cd web && bun run typecheck`
+Expected: PASS
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add web/src/components/organisms/agent/ControlBar.vue
+git commit -m "feat(agent): ControlBar component for pause/resume/skip/approve/deny/cancel"
+```
+
+---
+
+## Task 9: 集成到 TurnEntry.vue
+
+**Files:**
+
+- Modify: `web/src/components/organisms/agent/TurnEntry.vue`
+
+- [ ] **Step 1: 扩展 emits 与 props**
+
+```ts
+defineEmits<{
+  execute: [];
+  cancel: [];
+  focus: [];
+  reply: [value: unknown];
+  pause: [];
+  resume: [];
+  skip: [];
+  approve: [];
+  deny: [];
+}>();
+```
+
+`isActive` 计算更新覆盖新状态：
+
+```ts
+const isActive = computed(
+  () =>
+    props.turn.agent.status === 'pending' ||
+    props.turn.agent.status === 'running' ||
+    props.turn.agent.status === 'paused' ||
+    props.turn.agent.status === 'waiting_for_user',
+);
+```
+
+`activityEvents` 过滤新事件：
+
+```ts
+const activityEvents = computed(() =>
+  (props.turn.agent.events || [])
+    .filter((event) =>
+      event.message &&
+      !event.type.startsWith('job.succeeded') &&
+      event.type !== 'agent.thinking' &&    // thinking 单独折叠区
+      event.type !== 'agent.progress' &&    // progress 单独条
+      event.type !== 'tool.partial',        // partial 不进活动列表
+    )
+    .slice(-4),
+);
+
+const hasPlanRiskStep = computed(() =>
+  Boolean(
+    props.turn.agent.planResult?.proposedActions?.some(
+      (a) => a.riskLevel === 'high' || a.requiresConfirmation,
+    ),
+  ),
+);
+
+const thinkingExpanded = ref(false);
+```
+
+- [ ] **Step 2: 替换 template 中的"按钮行"为 `AskPrompt + ControlBar + 进度条 + thinking`**
+
+把 line 78-138 之间的内容替换为：
+
+```vue
+<div v-if="turn.agent.status === 'running' || turn.agent.status === 'paused'" class="ff-te__progress" />
+
+<div v-if="turn.agent.progress" class="ff-te__progress-meta">
+  <span class="ff-te__progress-label">{{ t('agent.v2.turn.progress.label') }}</span>
+  <span class="ff-te__progress-num">
+    <MonoNumber :value="`${turn.agent.progress.step}/${turn.agent.progress.total}`" />
+  </span>
+  <span v-if="turn.agent.progress.message" class="ff-te__progress-msg">{{ turn.agent.progress.message }}</span>
+</div>
+
+<details v-if="turn.agent.thinking" class="ff-te__thinking" :open="thinkingExpanded" @toggle="(e) => (thinkingExpanded = (e.target as HTMLDetailsElement).open)">
+  <summary>{{ t('agent.v2.turn.thinking.label') }}</summary>
+  <pre class="ff-te__thinking-body">{{ turn.agent.thinking }}</pre>
+</details>
+
+<ol v-if="activityEvents.length" class="ff-te__events">
+  <li v-for="event in activityEvents" :key="event.id" class="ff-te__event">
+    <span class="ff-te__event-dot" />
+    <span>{{ event.message }}</span>
+  </li>
+</ol>
+
+<AskPrompt
+  v-if="turn.agent.pendingAsk"
+  :ask="turn.agent.pendingAsk"
+  @reply="(value) => $emit('reply', value)"
+/>
+
+<p v-if="resultText" class="ff-te__sum ff-te__answer">
+  {{ resultText }}
+</p>
+
+<p v-else-if="turn.agent.planResult?.summary" class="ff-te__sum">
+  {{ turn.agent.planResult.summary }}
+</p>
+
+<section v-if="!resultText && turn.agent.planResult?.proposedActions?.length" class="ff-te__actions">
+  <PlanActionRow
+    v-for="a in turn.agent.planResult.proposedActions"
+    :key="a.step"
+    :action="a"
+  />
+</section>
+
+<div v-if="turn.agent.planResult?.costEstimate" class="ff-te__cost">
+  <!-- 既有 cost block 保持原样 -->
+</div>
+
+<div v-if="turn.agent.executeResult?.warnings?.length" class="ff-te__warn">
+  <!-- 既有 warn block 保持原样 -->
+</div>
+
+<div v-if="turn.agent.errorMessage" class="ff-te__err">{{ turn.agent.errorMessage }}</div>
+
+<div v-if="canExecute || isActive" class="ff-te__row">
+  <Button
+    v-if="canExecute"
+    variant="primary"
+    size="sm"
+    @click.stop="$emit('execute')"
+  >{{ t('agent.v2.turn.execute') }}</Button>
+  <ControlBar
+    v-if="isActive"
+    :status="turn.agent.status"
+    :has-plan-risk-step="hasPlanRiskStep"
+    @pause="$emit('pause')"
+    @resume="$emit('resume')"
+    @skip="$emit('skip')"
+    @approve="$emit('approve')"
+    @deny="$emit('deny')"
+    @cancel="$emit('cancel')"
+  />
+</div>
+```
+
+加入 imports：
+
+```ts
+import { computed, ref } from 'vue';
+import AskPrompt from './AskPrompt.vue';
+import ControlBar from './ControlBar.vue';
+```
+
+- [ ] **Step 3: 扩展 style，给新元素加样式**
+
+```css
+.ff-te__status--waiting_for_user { color: var(--ac); }
+.ff-te__status--paused { color: var(--status-warning); }
+
+.ff-te__progress-meta {
+  display: flex; gap: var(--sp-md); align-items: baseline;
+  font-family: var(--font-mono); font-size: var(--text-small);
+  letter-spacing: var(--tracking-wide); text-transform: uppercase;
+  color: var(--text-tertiary);
+}
+.ff-te__progress-label { color: var(--text-tertiary); }
+.ff-te__progress-num { color: var(--text-secondary); }
+.ff-te__progress-msg { color: var(--text-secondary); text-transform: none; letter-spacing: normal; }
+
+.ff-te__thinking {
+  border: 1px dashed var(--border-default);
+  padding: var(--sp-sm) var(--sp-md);
+  font-family: var(--font-mono); font-size: var(--text-small);
+}
+.ff-te__thinking summary {
+  cursor: pointer; color: var(--text-tertiary);
+  letter-spacing: var(--tracking-wide); text-transform: uppercase;
+}
+.ff-te__thinking-body {
+  margin: var(--sp-sm) 0 0; white-space: pre-wrap; color: var(--text-secondary);
+  max-height: 240px; overflow: auto;
+}
+```
+
+- [ ] **Step 4: 同步 status i18n key 渲染**
+
+`statusLabel` 已用 `agent.v2.turn.status.${status}` 模板拼接——新加的 `waiting_for_user` / `paused` i18n key 已在 Task 3 加入，因此 TypeScript 不会报错。
+
+- [ ] **Step 5: typecheck**
+
+Run: `cd web && bun run typecheck`
+Expected: PASS
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add web/src/components/organisms/agent/TurnEntry.vue
+git commit -m "feat(agent): TurnEntry renders ask/progress/thinking/control bar"
+```
+
+---
+
+## Task 10: TaskInputDock.vue — waiting/paused 时锁主输入
+
+**Files:**
+
+- Modify: `web/src/components/organisms/agent/TaskInputDock.vue`
+- Modify: 父容器（找到使用 TaskInputDock 的页面，传新的 disabled）
+
+- [ ] **Step 1: TaskInputDock 不改 props 定义（已有 disabled）；改用法**
+
+`TaskInputDock` 的 `disabled` 已经接受 boolean——只需要在父容器传值时把 `waiting_for_user` / `paused` 也算上。
+
+- [ ] **Step 2: 找到 TaskInputDock 的使用方**
+
+Run: `grep -rn "TaskInputDock" web/src/`
+
+预计在 `web/src/views/agent/` 或 `web/src/pages/agent/` 下；找出后修改 disabled 绑定：
+
+```vue
+<TaskInputDock
+  :model-value="taskInput"
+  :policy="policy"
+  :reasoning-effort="reasoningEffort"
+  :disabled="
+    isSending ||
+    activeSession?.messages.some(
+      (m) => m.role === 'agent' && (m.status === 'waiting_for_user' || m.status === 'paused')
+    )
+  "
+  @update:model-value="(v) => (taskInput = v)"
+  @update:policy="(v) => (policy = v)"
+  @update:reasoning-effort="(v) => (reasoningEffort = v)"
+  @submit="sendMessage"
+/>
+```
+
+> 注：如果父容器已有别的 disabled 来源，用 `||` 叠加；不要替换。
+
+- [ ] **Step 3: typecheck + 跑既有 TaskInputDock 相关 spec（如有）**
+
+Run: `cd web && bun run typecheck`
+Expected: PASS
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add web/src/components/organisms/agent/TaskInputDock.vue web/src/<父容器路径>
+git commit -m "feat(agent): lock TaskInputDock while turn waits for user or paused"
+```
+
+---
+
+## Task 11: 端到端 spec — ask 全链路 + pause/resume + cancel via inbox
+
+**Files:**
+
+- Modify: `web/src/composables/useAgentSession.spec.ts`
+
+- [ ] **Step 1: 写测试**
+
+在 `useAgentSession.spec.ts` 末尾追加。沿用 Task 6 已建立的 `vi.mock` + `vi.mocked` + `loadComposable()` 风格（**不**用 `vi.spyOn(await import(...))`）：
+
+```ts
+import type { AgentJobEvent } from '../types/agent';
+
+describe('useAgentSession — A frontend end-to-end', () => {
+  it('replyToAsk forwards reply via inbox and advances status to running', async () => {
+    vi.mocked(agentApi.sendAgentReply).mockResolvedValue({
+      inboxMessageId: '1', kind: 'reply', acceptedAt: '2026-05-26T00:00:00Z',
+    });
+
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, replyToAsk } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-e2e', role: 'agent', content: '', status: 'waiting_for_user',
+      events: [], timestamp: new Date().toISOString(), executeJobId: '99',
+      pendingAsk: {
+        messageId: '101', prompt: 'pick', schema: { choice: ['A', 'B'] },
+        timeoutSec: 60, askedAt: new Date().toISOString(),
+      },
+    };
+    session.messages.push(msg);
+
+    await replyToAsk(msg, 'A');
+
+    expect(agentApi.sendAgentReply).toHaveBeenCalledWith('99', '101', 'A');
+    expect(msg.status).toBe('running');
+    expect(msg.pendingAsk).toBeUndefined();
+  });
+
+  it('pause + resume sends control.pause then control.resume', async () => {
+    vi.mocked(agentApi.pauseAgentJob).mockResolvedValue({
+      inboxMessageId: '2', kind: 'control.pause', acceptedAt: '2026-05-26T00:00:00Z',
+    });
+    vi.mocked(agentApi.resumeAgentJob).mockResolvedValue({
+      inboxMessageId: '3', kind: 'control.resume', acceptedAt: '2026-05-26T00:00:00Z',
+    });
+
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, pauseTurn, resumeTurn } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-pp', role: 'agent', content: '', status: 'running',
+      events: [], timestamp: new Date().toISOString(), executeJobId: '77',
+    };
+    session.messages.push(msg);
+
+    await pauseTurn(msg);
+    expect(agentApi.pauseAgentJob).toHaveBeenCalledWith('77');
+
+    await resumeTurn(msg);
+    expect(agentApi.resumeAgentJob).toHaveBeenCalledWith('77');
+  });
+
+  it('cancel goes through inbox helper (not legacy /cancel route)', async () => {
+    vi.mocked(agentApi.cancelAgentTurn).mockResolvedValue({
+      inboxMessageId: '4', kind: 'control.cancel', acceptedAt: '2026-05-26T00:00:00Z',
+    });
+
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, cancel } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-c', role: 'agent', content: '', status: 'running',
+      events: [], timestamp: new Date().toISOString(), executeJobId: '55',
+    };
+    session.messages.push(msg);
+
+    await cancel(msg);
+    expect(agentApi.cancelAgentTurn).toHaveBeenCalledWith('55');
+    expect(msg.status).toBe('canceled');
+  });
+});
+```
+
+- [ ] **Step 2: 运行**
+
+Run: `cd web && bun run test useAgentSession`
+Expected: PASS（含新 3 个用例 + 全部既有用例）
+
+- [ ] **Step 3: 运行全前端测试 smoke**
+
+Run: `cd web && bun run test`
+Expected: 全部 PASS（含 useAskTimeout、useAgentSession）
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add web/src/composables/useAgentSession.spec.ts
+git commit -m "test(agent): end-to-end specs for ask/pause/resume/cancel via inbox"
+```
+
+---
+
+## Task 12: 手动验证 + 截图
+
+**Files:** N/A（dev server + 浏览器）
+
+- [ ] **Step 1: 启动后端 + worker + 前端**
+
+Run（三个终端）：
+
+- `cd app && uv run uvicorn fileflash.main:app --reload`
+- `cd app && uv run python -m fileflash.scripts.run_with_workers`
+- `cd web && bun run dev`
+
+- [ ] **Step 2: 在浏览器中跑 4 个场景**
+
+1. **agent.progress 实时显示**：发一个会有多步的请求（例如"列出根目录"），观察 TurnEntry 出现 `PROGRESS step/total` 行
+2. **手动暂停 + 恢复**：长任务中点 Pause → 等 3s → 点 Resume；UI 应在 `agent.paused` / `agent.resumed` 事件到达时切换状态
+3. **取消走 inbox**：长任务中点 Cancel；Network 面板应只见到 `POST /agent/jobs/<id>/messages`（body `{kind:"control.cancel"}`），**不**应有任何 `POST /agent/cancel/<id>`
+4. **ask 流程**：手动触发一个会调 `AskProtocol.ask()` 的场景（若 PlanRunner 暂未启用 ask，跳过此项并在 acceptance checklist 标注"待后续 prompt 模板启用"）
+
+- [ ] **Step 3: 监控 console + Network**
+
+Network 应无 404、500；console 应无报红错误；旧的 `agent/cancel/...` 调用应已不出现。
+
+- [ ] **Step 4: 截图保留**
+
+把 3-4 个场景截图保存到本地（PR 描述贴）。
+
+> 注：本 Task 不写代码也不 commit；它是"验收门"。
+
+---
+
+## Acceptance Checklist
+
+- [ ] `web/src/types/agent.d.ts` 含 14 种 `AgentJobEventType` 与 7 种 `AgentInboxMessageKind`
+- [ ] `web/src/api/agent.ts` 删除 `cancelAgentJob`、新增 `sendAgentMessage` 与 6 个 control helper（pause/resume/approve/deny/skip/cancel）+ `sendAgentReply`
+- [ ] `useAgentSession.ts` 的 `MsgStatus` 含 `waiting_for_user` / `paused`；`ChatMessage` 含 `pendingAsk` / `pauseRequestedAt` / `progress` / `thinking` / `partials`
+- [ ] `useAgentSession` 暴露 `replyToAsk` / `pauseTurn` / `resumeTurn` / `approveStep` / `denyStep` / `skipStep`；`cancel` 走 `control.cancel`
+- [ ] `AskPrompt.vue` 渲染 prompt + schema.choice 按钮组 / 自由文本 + 倒计时；`ControlBar.vue` 按状态渲染按钮
+- [ ] `TurnEntry.vue` 显示 progress 条、thinking 折叠区、AskPrompt、ControlBar；状态行支持新状态
+- [ ] `TaskInputDock.vue` 在 `waiting_for_user` / `paused` 时主输入框 disable
+- [ ] 13 条新 i18n key 中英文齐全
+- [ ] `useAgentSession.spec.ts` + `useAskTimeout.spec.ts` 全部 PASS
+- [ ] Task 12 手测 3+ 场景通过，Network 中没有遗留的 `POST /agent/cancel/...` 调用
+
+## 范围外（留给后续）
+
+- prompt 模板里 LLM 触发 `ask` 的判断逻辑（A-backend Task 14 step 3 已注明）—— 触发后本前端 plan 的 AskPrompt 会自动渲染
+- `tool.partial` 的 UI 渲染（本 plan 仅做数据缓存，UI 留给后续；TurnEntry 当前不渲染 partials 内容）
+- 思考块的 token 级流式动画（spec 明确不做）
+- 多 tab/多端同步（spec 明确不做）
diff --git a/docs/superpowers/specs/2026-05-26-agent-improvements-design.md b/docs/superpowers/specs/2026-05-26-agent-improvements-design.md
new file mode 100644
index 0000000..26ab36e
--- /dev/null
+++ b/docs/superpowers/specs/2026-05-26-agent-improvements-design.md
@@ -0,0 +1,456 @@
+# Agent 子系统改进设计（2026-05-26）
+
+## 背景与目标
+
+FileFlash 当前 agent 子系统存在三个互相牵连的问题：
+
+1. **交互、反馈机制不完善**——只有单向 SSE，事件由后端 0.6s 轮询 DB 产出；事件类型贫乏；用户在 plan 之后不能与 agent 中途对话；只能 cancel 整个 job，无 pause/resume/step 审批。
+2. **删除 session 没有级联**——前端 `deleteSession()` 仅清 localStorage；后端无 DELETE 接口；BackgroundJob 与"对话级 session"之间没有归属关系。
+3. **内置工具太少**——硬编码 9 个 `drive.*`，扩展一个工具要改 3 处（`DEFAULT_AGENT_TOOLS` / `_tool_schemas` / `router.dispatch`）。
+
+本设计把以上三件事拆成三个互相独立、可分别落地的子项目，从架构层把"双向交互通道、对话级 session、工具表"这三块地基补齐。
+
+## 顶层路线图
+
+| 子项目 | 内容 | 体量 |
+|---|---|---|
+| **A. 交互/反馈层重构** | Redis pub/sub 替换 DB 轮询；POST 上行 inbox；新事件类型；ask/pause/resume/step approve | 大 |
+| **B. ChatSession 上升到后端 + 软删除 + 级联中断** | 新建 `AgentChatSession` 表；BackgroundJob 归属到 session；DELETE 接口；前端 localStorage 迁服务端 | 中 |
+| **C. ToolRegistry 注册架构 + 5 个查询工具** | `ToolSpec` 对象替代 if/elif；schema/dispatch/risk 三合一；新增 search/getInfo/listRecent/statsByCategory/findDuplicates | 中 |
+
+依赖关系：
+
+```
+A ──► B   （B 的 worker 中断与 session 级 control 复用 A 的 inbox 通道）
+   │
+   └──► C  （C 与 B 互不依赖，可并行）
+```
+
+推荐顺序：**A → 并行(B,C) → 收尾**。
+
+## 统一非目标（三个子项目共同）
+
+- 不引入 WebSocket（双向通道用 SSE 推送 + POST inbox）
+- 不引入新的存储引擎（Redis 已在用、PostgreSQL 已在用）
+- 不重写 prompt 模板
+- 不动 skill 体系（`AgentSkill` / `tool_whitelist_json` 语义保留）
+- 不做 MCP server 接入
+- 不做工具运行时配额（`harness/budget.py` 仍是 scaffold）
+- 不做内容理解类工具（OCR、摘要等）
+
+---
+
+## 子项目 A：交互/反馈层重构
+
+### A.1 架构组件
+
+```
+                  ┌────────────────┐
+worker (agent) ──►│  AgentEventBus │──► Redis pub/sub channel
+                  └────────────────┘     agent:job:{job_id}:events
+                          ▲
+                          │ subscribe
+                  ┌───────┴──────────┐
+       web ──────►│  SSE endpoint    │────► browser
+                  └──────────────────┘
+                                                     ┌────────────────┐
+       browser ──POST messages──► web ──► AgentInbox │ → Redis channel│
+                                          (写 DB +)  │   agent:job:..:│
+                                                     │   inbox        │
+                                                     └────────────────┘
+                                                              ▲
+                                                              │ subscribe
+                                                          worker (await)
+```
+
+四个新单元，每个职责单一：
+
+| 单元 | 文件 | 职责 |
+|---|---|---|
+| `AgentEventBus` | `agents/harness/event_bus.py`（替换现有空 scaffold） | 把事件 publish 到 Redis；提供异步订阅器 |
+| `AgentInbox` | `agents/harness/inbox.py`（新） | 接收用户上行消息，写 DB + publish 到 inbox channel |
+| `AskProtocol` | `agents/harness/ask.py`（新） | runner 调用 `await ask(...)` 暂停等回答；底层订阅 inbox channel |
+| 新 schema | `schemas/agent.py` 扩展 | 新事件类型 + 上行 message 类型 |
+
+### A.2 数据流（以 agent 中途提问为例）
+
+1. `plan_runner` 决定需要澄清 → `await AskProtocol.ask(job_id, prompt, schema, timeout)`
+2. `AskProtocol`：① 写一行 `AgentInboxMessage(role=agent, kind=ask, status=waiting)`；② `event_bus.publish(agent.ask)`；③ 在 `asyncio.Event` 上等待 inbox 订阅器唤醒
+3. 前端收到 `agent.ask` SSE → 渲染选择气泡 → 用户选择 → `POST /agent/jobs/{id}/messages` body `{kind:"reply", reply_to:<message_id>, value:...}`
+4. `AgentInbox.handle`：① 写 `AgentInboxMessage(role=user, kind=reply, reply_to=...)`；② publish 到 `agent:job:{id}:inbox`
+5. worker 端 `AskProtocol` 订阅器收到消息 → set `asyncio.Event` → 调用方 `await` 返回回答 → runner 继续
+
+### A.3 新事件类型（`schemas/agent.py`）
+
+**下行**（worker → 前端，沿 SSE）：
+
+- `agent.thinking` — `{text}` 阶段性 reasoning 块（不做 token 级流）
+- `agent.progress` — `{step, total, message, percent?}` 长任务进度
+- `agent.ask` — `{message_id, prompt, schema, timeout_sec}` 请用户回答
+- `agent.paused` / `agent.resumed` — 状态变化广播
+- `tool.partial` — `{tool_name, step_no, chunk}` 大输出分段
+- 保留：`job.*` / `plan.ready` / `tool.started/succeeded/failed`
+
+**上行**（前端 → worker，沿 POST `/agent/jobs/{id}/messages`，body 区分 `kind`）：
+
+- `kind:"reply"` — 回答 `agent.ask`
+- `kind:"control.pause"` / `kind:"control.resume"`
+- `kind:"control.approve"` / `kind:"control.deny"` — 单工具实时审批
+- `kind:"control.skip"` — 跳过当前步
+- `kind:"control.cancel"` — 取消（与既有 `POST /agent/cancel/{job_id}` 等价，新接口归一化）
+
+### A.4 新表
+
+```sql
+AgentInboxMessage
+  inbox_message_id   PK   BigInt Identity
+  job_id             FK   BackgroundJob CASCADE   NOT NULL
+  role               enum ('agent', 'user')
+  kind               enum ('ask', 'reply',
+                          'control.pause', 'control.resume',
+                          'control.approve', 'control.deny',
+                          'control.skip', 'control.cancel')
+  payload_json       JSONB                         NOT NULL
+  reply_to_id        FK   self                     NULL
+  status             enum ('waiting','answered','timed_out','dropped')
+                                                   NULL  -- 仅 kind=ask 用
+  created_at         DateTime                      NOT NULL
+  answered_at        DateTime                      NULL
+
+INDEX (job_id, created_at)
+INDEX (job_id, status)
+```
+
+事件本身不入库（已经在 Redis pub/sub）。审计如需要再加 `agent_event_log`，本轮不做。
+
+### A.5 SSE 推送实现替换
+
+`routers/agent.py` 的 `_event_stream`（agent.py:84）从 DB 轮询改为：
+
+```python
+async with event_bus.subscribe(job_id) as stream:
+    async for event in stream:
+        yield sse_format(event)
+```
+
+`AGENT_EVENT_POLL_INTERVAL_SEC` 配置项**直接删除**——agent 子系统当前没有第三方 API 消费者，不必保留 deprecation 期。DB 轮询逻辑彻底删除。
+
+### A.6 worker 中断/暂停实现
+
+`ExecuteRunner` 每步开始前：
+
+```python
+await inbox.consume_controls(job_id)   # 处理所有 pending control
+if state.is_paused:
+    await inbox.wait_for_resume(job_id)  # 阻塞直到 control.resume
+if state.is_canceled:
+    raise JobCancelled()
+```
+
+pause/resume/skip 不杀 worker——仅在 step 边界检查 inbox。意味着如果一个 LLM 调用正在进行（≤30s），pause 会在它返回后才生效。**真中断（HTTP 任务取消）不在本轮范围内**。
+
+### A.7 前端状态机变化
+
+`useAgentSession.ts` 增两个状态：
+
+- `waiting_for_user`（收到 `agent.ask`）
+- `paused`（收到 `agent.paused`）
+
+新组件/改动：
+
+- `TaskInputDock.vue`：`waiting_for_user` 时渲染 ask 选项/输入框；`paused` 时渲染恢复按钮
+- `TurnEntry.vue`：渲染 `agent.thinking` / `agent.progress` / `tool.partial`
+- 新增 `web/src/api/agent.ts:sendAgentMessage()` 调 POST `/agent/jobs/{id}/messages`
+
+### A.8 路由层变化
+
+新增：
+
+- `POST /agent/jobs/{job_id}/messages` — 上行通道（body 含 `kind`）
+
+删除：
+
+- `POST /agent/cancel/{job_id}` — 直接删除；取消改走 `POST /agent/jobs/{id}/messages` body `{kind:"control.cancel"}`
+
+保留不变：
+
+- `POST /agent/plan` / `POST /agent/execute` / `GET /agent/jobs/{id}/events`
+
+### A.9 测试策略
+
+- `AgentEventBus`：单元测试 publish/subscribe；fake Redis（既有项目已有的 fakeredis 复用，如无则 mock）
+- `AgentInbox`：集成测试 happy path + 重复 reply + 不存在的 reply_to
+- `AskProtocol`：测试超时；测试 worker 重启后 `status=waiting` 的 ask 会被 fail-fast（本轮不做从 DB 重建等待状态的 recovery）
+- SSE 端到端：mock worker publish 一串事件，前端断言收到顺序
+
+### A.10 非目标（A 特有）
+
+- 不做 token 级流式 thinking
+- 不做多 tab/多端同步（同账号多开浏览器不保证一致）
+- 不做 ask 超时后的自动 fallback（超时直接 fail job）
+- 不做 worker 端真中断 LLM 调用（只在 step 边界检查）
+
+---
+
+## 子项目 B：ChatSession 上升到后端 + 软删除 + 级联中断
+
+### B.1 关键事实
+
+- 后端 `AgentWorkSession` ≠ 前端 "Session"：前者是**单 job 的 checkpoint**（`job_id UNIQUE`）；后者是**前端 localStorage 对象**，含多个 ChatMessage、每条可关联多个 BackgroundJob。
+- 后端目前**没有"对话级 session"实体**，无法回答"这个 session 下有哪些 plan/job"。
+- 本子项目把对话级 session 实体化到后端，并基于它做软删除 + 级联中断。
+
+### B.2 新表
+
+```sql
+AgentChatSession
+  chat_session_id    PK   BigInt Identity
+  user_id            FK   User CASCADE        NOT NULL
+  title              String(255)              NOT NULL
+  archived           Boolean DEFAULT FALSE
+  deleted_at         DateTime                 NULL   -- 软删除标记
+  created_at         DateTime                 NOT NULL
+  updated_at         DateTime                 NOT NULL
+
+INDEX (user_id, deleted_at, updated_at DESC)
+```
+
+### B.3 BackgroundJob 改动
+
+- 新增 `chat_session_id FK AgentChatSession ON DELETE CASCADE NULLABLE`
+- 新增 `deleted_at DateTime NULL`（job 级软删除，跟随 session 软删除标记）
+- 旧 job（无 chat_session_id）保留 NULL，列表查询 default 隐藏；提供"未归属"过滤
+- FK 选 CASCADE 的原因：硬删 session 时 BackgroundJob 同步消失，再通过既有 `job_id CASCADE` 把 Plan/ActionLog/WorkSession/InboxMessage 一并清掉。NULLABLE 是为了兼容历史 job 与"显式归属未来某 session"两种情况。
+
+### B.4 API
+
+| Method | Path | 行为 |
+|---|---|---|
+| `POST /agent/chat-sessions` | 创建新 session（body: title?） | 返回 `{chat_session_id, ...}` |
+| `GET /agent/chat-sessions` | 当前用户未删除 session 列表（分页） | `deleted_at IS NULL` |
+| `GET /agent/chat-sessions/{id}` | 单 session + 该 session 下的 turn 概览 | 404 if 不属于当前用户或已软删 |
+| `PATCH /agent/chat-sessions/{id}` | 改 title / archived | 仅限自己 |
+| `DELETE /agent/chat-sessions/{id}` | **软删除**（流程见 B.5） | 200 |
+
+`POST /agent/plan` 和 `POST /agent/execute` 入参**强制**新增 `chat_session_id`（必填）；缺省直接返回 422。前端在迁移后所有调用点都传值。
+
+### B.5 DELETE 流程
+
+```
+1. SELECT ... FOR UPDATE 该 session（防并发）
+2. set chat_session.deleted_at = now()
+3. 找出该 session 下所有未完成 BackgroundJob（status in ('queued','running','planning','awaiting_confirm','executing','paused')）
+4. 对每个未完成 job：
+   - mark job.deleted_at = now()
+   - 调既有 cancel_job 逻辑 set cancel_requested_at
+   - 通过 A 的 inbox 写 AgentInboxMessage(kind='control.cancel') 唤醒 worker
+5. 已完成 job：仅 mark deleted_at，不回滚业务操作
+6. 关联 Plan / ActionLog / WorkSession / InboxMessage 保留（FK 是 job_id CASCADE，硬删时才级联）
+7. event_bus.publish('session.deleted', {chat_session_id})
+```
+
+> 注：drive 业务操作（move/delete 文件）一旦执行就不可逆。"取消" 仅停止后续步骤，不撤销已生效结果。
+
+### B.6 GC 任务
+
+- 新建 cron：每天扫 `chat_session.deleted_at < now() - INTERVAL '30 days'` 的记录，**硬删**
+- 硬删 chat_session 时关联表通过 FK CASCADE 自动清理：
+  - `BackgroundJob`（FK `chat_session_id ON DELETE CASCADE`）→ 触发 job 删除
+  - 进而 `AgentPlan` / `AgentActionLog` / `AgentWorkSession` / `AgentInboxMessage` 通过既有 `job_id CASCADE` 自动清
+- `AgentMemory` 走 `user_id`，不受影响
+- 未归属 session 的旧 job（`chat_session_id IS NULL`）不在 GC 范围内
+- GC 写入既有 cron 体系（参考 `services/admin/storage.py` 模式）
+
+### B.7 前端迁移
+
+- `useAgentSession.ts`：
+  - 删除 `STORAGE_KEY = 'fileflash.agent.sessions.v1'` 持久化（保留 in-memory cache）
+  - 初始化：调 `GET /agent/chat-sessions` 拉列表
+  - `createSession()` → `POST /agent/chat-sessions`，拿服务端 id
+  - `deleteSession()` → `DELETE /agent/chat-sessions/{id}`
+  - 旧 localStorage 数据：首次启动检测到旧 key 时，**逐条迁移**（POST 创建 session、把 ChatMessage 内 job_id 通过新接口 `POST /agent/chat-sessions/{id}/attach-jobs` 挂上），迁移完成后删除旧 key
+- `web/src/api/agent.ts`：新增 chat-session CRUD 方法
+- 单元测试 `useAgentSession.spec.ts` 改为对 mock API 断言而非对 localStorage 断言
+
+### B.8 worker 中断协议
+
+复用 A.6 的协议：B 不引入新的中断机制，只是确保 DELETE 流程发出的 `control.cancel` 能被 ExecuteRunner / PlanRunner 在 step 边界识别并抛 `JobCancelled`。
+
+### B.9 测试策略
+
+- API：测 CRUD + 权限隔离（A 用户不能删 B 的 session）+ 软删后 GET 返 404
+- DELETE 级联：建 session 含 2 个 running job、1 个 succeeded job → DELETE → 断言两个 running job `cancel_requested_at` 已设、inbox 收到 `control.cancel`、succeeded job 的 status 与执行结果不变（不触发取消），且所有 job（含 succeeded）`deleted_at` 已设
+- 前端迁移：mock 旧 localStorage 数据 + mock API，断言迁移后旧 key 已删、API 调用顺序正确
+- GC：插入 31 天前已软删的 session 跑 GC，断言记录消失
+
+### B.10 非目标（B 特有）
+
+- 不做"恢复已删 session" UI（数据 30 天内还在 DB，但本轮不出 UI）
+- 不做 session 跨用户共享
+- 不做 session 收藏/标签
+- 不做管理员强制硬删入口
+
+---
+
+## 子项目 C：ToolRegistry 注册架构 + 查询工具
+
+### C.1 现状痛点
+
+- `router.py:38-130` 一大串 if/elif；新加工具改 3 处
+- `policy.py:classify_tool_risk()` / `classify_tool_side_effect()` 又是一组 if/elif
+- `AgentSkill.tool_whitelist_json` 是字符串名单，无 registry 校验
+
+### C.2 ToolRegistry 结构
+
+```python
+# agents/harness/tool_registry.py（新）
+
+@dataclass(frozen=True)
+class ToolSpec:
+    name: str                              # "drive.listFolder"
+    description: str                       # 给 LLM 看
+    schema: dict[str, Any]                 # JSON Schema input
+    side_effect: Literal["read", "write"]
+    risk: Literal["low", "medium", "high"]
+    requires_confirmation: bool
+    handler: Callable[[ToolContext, dict], Awaitable[dict]]
+
+class ToolRegistry:
+    def register(self, spec: ToolSpec) -> None: ...
+    def get(self, name: str) -> ToolSpec: ...
+    def all(self) -> list[ToolSpec]: ...
+    def schemas_for(self, names: list[str]) -> list[dict]: ...
+
+REGISTRY = ToolRegistry()
+```
+
+`ToolContext` 保留现有 router.py 内传 ctx 的形态（携带 db session、user、job 等）。
+
+### C.3 文件布局
+
+```
+agents/
+  harness/
+    tool_registry.py        ← 新：Spec + Registry
+  tools/                    ← 新目录
+    __init__.py             ← import 所有工具触发注册
+    drive_list_folder.py
+    drive_count_files.py
+    drive_create_folder.py
+    drive_move_file.py
+    drive_move_folder.py
+    drive_rename_file.py
+    drive_rename_folder.py
+    drive_delete_file.py
+    drive_delete_folder.py
+    # —— 本轮新增 5 个查询工具 ——
+    drive_search_files.py
+    drive_get_file_info.py
+    drive_list_recent.py
+    drive_stats_by_category.py
+    drive_find_duplicates.py
+```
+
+每个工具文件结构：
+
+```python
+# agents/tools/drive_list_folder.py
+from ..harness.tool_registry import REGISTRY, ToolSpec
+from ..harness.context import ToolContext
+
+async def _handle(ctx: ToolContext, args: dict) -> dict:
+    ...  # 业务逻辑（从 router.py 搬过来）
+
+REGISTRY.register(ToolSpec(
+    name="drive.listFolder",
+    description="List entries inside a folder.",
+    schema={...},                      # 从 plan_runner._tool_schemas 搬
+    side_effect="read",
+    risk="low",
+    requires_confirmation=False,
+    handler=_handle,
+))
+```
+
+### C.4 拆掉的旧代码
+
+- `router.py:dispatch` 的 if/elif 全部删除 → 改为 `spec = REGISTRY.get(name); return await spec.handler(ctx, args)` + 通用错误包装
+- `plan_runner.py:_tool_schemas` → `REGISTRY.schemas_for(whitelist or REGISTRY.all_names())`
+- `plan_runner.py:DEFAULT_AGENT_TOOLS` → 不再硬编码；改从 `REGISTRY.all_names()` 计算（或保留作为"默认启用名单"配置项）
+- `policy.py:classify_tool_risk / classify_tool_side_effect` → 从 `REGISTRY.get(name).risk / side_effect` 读取；删除 if/elif 表
+- `AgentSkill` 保存时调 `REGISTRY.validate(whitelist)`：未知工具名直接 422（注意：`validate()` 与上文用到的 `all_names()` 未列在 C.2 的 `ToolRegistry` 接口草图中，实现时需一并补充）
+
+### C.5 新增 5 个查询工具
+
+| name | 入参 | 出参 | 实现说明 |
+|---|---|---|---|
+| `drive.searchFiles` | `query` / `folder_id?` / `category?` / `mime_prefix?` / `modified_after?` / `limit≤200` | `[{file_id,name,path,size,mime,modified_at}]` | 复用 `services/files` 既有查询能力；不做全文 |
+| `drive.getFileInfo` | `file_id` | 单条详情 + 路径 + size + mime + tags | 复用现有 getFile |
+| `drive.listRecent` | `limit≤50` / `since?` | 最近修改的文件列表 | 走既有最近活动查询 |
+| `drive.statsByCategory` | `folder_id?` | `{image:N, video:N, document:N, other:N, total_size}` | 利用 mime/category 分桶 |
+| `drive.findDuplicates` | `folder_id?` / `by="hash"\|"name+size"` | 重复文件组列表 | 用既有 hash 字段 |
+
+全部 `side_effect=read`、`risk=low`、`requires_confirmation=false`，不进审批流。
+
+### C.6 plan_runner / prompt 影响
+
+- `DEFAULT_AGENT_TOOLS` 从 9 个变 14 个
+- prompt 模板**不动**——schema 自动从 registry 取
+- `_skill_tool_whitelist()` 行为不变（仍读 `AgentSkill.tool_whitelist_json`），但加 registry 校验
+
+### C.7 测试策略
+
+- `ToolRegistry`：单元测试（注册/查找/重复名字报错/未知名字报错/schemas_for 顺序）
+- 每个新工具：集成测试调 handler → 期望输出。**用真 DB + 真 services**（不 mock，遵循项目原则）
+- `policy.py` 改用 registry 后：保留原有风险/副作用的回归测试，断言读 registry 与旧 if/elif 给出同结果
+- 端到端：plan 一个含 `drive.searchFiles` 的请求 → 断言 LLM 拿到该工具的 schema → execute → action_log 有正确记录
+
+### C.8 非目标（C 特有）
+
+- 不做 MCP server 接入（`AgentMcpServer` 表保留，本轮不动）
+- 不做工具版本/弃用机制
+- 不做工具运行时配额
+- 不做内容理解工具（OCR/摘要/缩略图）
+- 不动 `AgentSkill.tool_whitelist_json` 数据形态（仍是字符串名单）
+
+---
+
+## 跨子项目影响矩阵
+
+| 文件 / 模块 | A 改动 | B 改动 | C 改动 |
+|---|---|---|---|
+| `models/tables_agent.py` | + `AgentInboxMessage` | + `AgentChatSession`；`BackgroundJob` 加列 | — |
+| `schemas/agent.py` | + 新事件类型、上行 message 类型 | + ChatSession schema | — |
+| `routers/agent.py` | + POST `/agent/jobs/{id}/messages`；SSE 改 event_bus | + chat-sessions CRUD；plan/execute 入参 | — |
+| `agents/harness/events.py` | 替换为 `event_bus.py` | — | — |
+| `agents/harness/inbox.py` | 新 | — | — |
+| `agents/harness/ask.py` | 新 | — | — |
+| `agents/harness/policy.py` | — | — | 读 registry 替代 if/elif |
+| `agents/harness/router.py` | — | — | dispatch 改为 registry lookup |
+| `agents/runtime/plan_runner.py` | 接 ask | 接 chat_session_id | schema 改读 registry |
+| `agents/runtime/execute_runner.py` | step 边界检查 inbox / pause | 同 A | dispatch 简化 |
+| `agents/tools/` | — | — | 新目录，14 个工具文件 |
+| `services/admin/storage.py`（GC） | — | + chat-session GC 任务 | — |
+| `web/src/composables/useAgentSession.ts` | + waiting_for_user / paused 状态 | localStorage → API | — |
+| `web/src/components/organisms/agent/` | TurnEntry / TaskInputDock 渲染新事件 | SessionList 调 API | — |
+| `web/src/api/agent.ts` | + sendAgentMessage | + chat-session CRUD | — |
+
+## 兼容与迁移
+
+- **后端 API**：本设计**不要求向后兼容**——agent 子系统目前没有公开第三方 API 消费者；旧的 `POST /agent/cancel/{job_id}` 直接删除，前端同 PR 切换到 `control.cancel`
+- **前端 localStorage**：`fileflash.agent.sessions.v1` 数据**一次性迁移**到服务端；迁移完成清 key
+- **数据库迁移**：3 张表层面的改动（新增 `AgentInboxMessage` / `AgentChatSession`、`BackgroundJob` 加列），用 Alembic 一次迁移完成；旧 BackgroundJob `chat_session_id` 留 NULL（视作未归属）
+- **配置项**：`AGENT_EVENT_POLL_INTERVAL_SEC` 删除；新增 `AGENT_INBOX_ASK_TIMEOUT_SEC`（默认 1800s）、`AGENT_CHAT_SESSION_GC_DAYS`（默认 30）
+
+## 滚动出场顺序
+
+1. **A 全量上线**：A 是基础设施，B/C 都依赖它；A 不上线则 B 的中断协议无处发、C 的 step approval 也没通道
+2. **B 与 C 可并行**：互不依赖
+3. **每个子项目独立 PR / 独立 plan**：在写 implementation plan 时，按子项目各自拆 phase
+
+## 风险与开放问题
+
+- **Redis pub/sub 可靠性**：消息丢失风险存在（订阅者未连上时 publish 的消息会丢）。缓解：① 关键状态（ask、控制信号）持久化到 `AgentInboxMessage` 表；② SSE 重连时前端从 inbox/action_log 增量拉一次 catch-up。**event_bus 的事件本身不持久化是 acceptable 的**（属于实时通知）。
+- **worker 多副本**：当前 `AgentWorkerConsumer` 可能多副本运行（`agent-{uuid}` 命名）。`AskProtocol` 等待的 `asyncio.Event` 是进程内的——如果用户回复到来时该 worker 已挂，`status=waiting` 的 ask 永远不会被消费。**缓解**：worker 启动时扫一次 owned-by-self 的 waiting ask、超过 timeout 直接 fail；同时 `AGENT_INBOX_ASK_TIMEOUT_SEC` 默认 30 分钟限制阻塞时间。
+- **真中断 LLM 调用**：不在本轮范围。若用户对"pause 后 30s 才生效"反馈强烈，下一轮加 httpx 任务取消。
+- **前端迁移失败**：localStorage 迁移过程中网络失败可能丢数据。缓解：迁移**幂等**——同步前不删 localStorage；服务端创建成功后再删。
diff --git a/web/src/api/agent.spec.ts b/web/src/api/agent.spec.ts
new file mode 100644
index 0000000..0466f2d
--- /dev/null
+++ b/web/src/api/agent.spec.ts
@@ -0,0 +1,47 @@
+import { describe, expect, it, vi, beforeEach, afterEach } from 'vitest';
+
+vi.mock('../store/user', () => ({
+  useUserStore: () => ({ token: 'test-token' }),
+}));
+
+import { createAgentSseParser, streamAgentJobEvents } from './agent';
+import type { AgentJobEvent } from '../types/agent';
+
+describe('api/agent event stream helpers', () => {
+  const originalFetch = globalThis.fetch;
+
+  beforeEach(() => {
+    vi.restoreAllMocks();
+  });
+
+  afterEach(() => {
+    globalThis.fetch = originalFetch;
+  });
+
+  it('parses SSE events across multiple chunks', () => {
+    const events: AgentJobEvent[] = [];
+    const parser = createAgentSseParser((event) => events.push(event));
+
+    parser.feed('event: job.running\n');
+    parser.feed(
+      'data: {"id":"1","jobId":"j1","taskType":"agent.plan","type":"job.running","status":"running","message":"正在规划","data":{},"timestamp":"2026-05-20T00:00:00Z"}\n\n',
+    );
+    parser.feed(
+      'event: plan.ready\ndata: {"id":"2","jobId":"j1","taskType":"agent.plan","type":"plan.ready","status":"succeeded","message":"计划已生成","data":{"result":{"planHash":"h1"}},"timestamp":"2026-05-20T00:00:01Z"}\n\n',
+    );
+    parser.flush();
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe('job.running');
+    expect(events[1].data.result.planHash).toBe('h1');
+  });
+
+  it('throws on stream setup failure so callers can fall back to polling', async () => {
+    globalThis.fetch = vi.fn().mockResolvedValue({
+      ok: false,
+      status: 503,
+    } as Response) as unknown as typeof fetch;
+
+    await expect(streamAgentJobEvents('job-1')).rejects.toThrow('503');
+  });
+});
diff --git a/web/src/api/agent.ts b/web/src/api/agent.ts
index b05f22a..5938f0b 100644
--- a/web/src/api/agent.ts
+++ b/web/src/api/agent.ts
@@ -1,7 +1,10 @@
 import http from '../utils/http';
+import { useUserStore } from '../store/user';
 import type {
   AgentBackgroundJob,
-  CancelAgentResponse,
+  AgentInboxMessageRequest,
+  AgentInboxMessageResponse,
+  AgentJobEvent,
   ExecuteAgentRequest,
   ExecuteAgentResponse,
   PlanAgentRequest,
@@ -16,10 +19,114 @@ export const executeAgentPlan = (data: ExecuteAgentRequest) => {
   return http.post<ExecuteAgentResponse>('/agent/execute', data);
 };
 
-export const cancelAgentJob = (jobId: string) => {
-  return http.post<CancelAgentResponse>(`/agent/cancel/${encodeURIComponent(jobId)}`);
+export const sendAgentMessage = (
+  jobId: string,
+  body: AgentInboxMessageRequest,
+) => {
+  return http.post<AgentInboxMessageResponse>(
+    `/agent/jobs/${encodeURIComponent(jobId)}/messages`,
+    body,
+  );
 };
 
+export const sendAgentReply = (
+  jobId: string,
+  replyTo: string,
+  value: unknown,
+) => sendAgentMessage(jobId, { kind: 'reply', replyTo, value });
+
+export const pauseAgentJob = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.pause' });
+
+export const resumeAgentJob = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.resume' });
+
+export const approveAgentStep = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.approve' });
+
+export const denyAgentStep = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.deny' });
+
+export const skipAgentStep = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.skip' });
+
+export const cancelAgentTurn = (jobId: string) =>
+  sendAgentMessage(jobId, { kind: 'control.cancel' });
+
 export const getAgentJob = <T = Record<string, any>>(jobId: string) => {
   return http.get<AgentBackgroundJob<T>>(`/jobs/${encodeURIComponent(jobId)}`);
 };
+
+export interface AgentJobEventHandlers {
+  onEvent?: (event: AgentJobEvent) => void;
+}
+
+export const createAgentSseParser = (onEvent: (event: AgentJobEvent) => void) => {
+  // Incremental SSE parser: feed() accepts decoded text chunks, flush() parses any unterminated tail.
+  // Each block's data payload is JSON-parsed and passed to onEvent; malformed JSON throws to the caller.
+  let buffer = '';
+
+  const parseBlock = (block: string) => {
+    // Only "data:" lines are used; other fields (e.g. "event:") and blank payloads are skipped.
+    const dataLines = block.split('\n').filter((line) => line.startsWith('data:'));
+    const raw = dataLines.map((line) => line.slice(5).trimStart()).join('\n').trim();
+    if (!raw) return;
+    onEvent(JSON.parse(raw) as AgentJobEvent);
+  };
+
+  const feed = (chunk: string) => {
+    // Normalize the whole buffer, not just the chunk: a CRLF pair can be split across two reads.
+    buffer = (buffer + chunk).replace(/\r\n/g, '\n');
+    let boundary = buffer.indexOf('\n\n');
+    while (boundary >= 0) {
+      const block = buffer.slice(0, boundary);
+      buffer = buffer.slice(boundary + 2);
+      parseBlock(block);
+      boundary = buffer.indexOf('\n\n');
+    }
+  };
+
+  const flush = () => {
+    if (!buffer.trim()) return;
+    parseBlock(buffer);
+    buffer = '';
+  };
+
+  return { feed, flush };
+};
+
+export const streamAgentJobEvents = async (
+  jobId: string,
+  handlers: AgentJobEventHandlers = {},
+  signal?: AbortSignal,
+) => {
+  // Streams the job's SSE endpoint via fetch, forwarding each parsed event to handlers.onEvent.
+  // Rejects on a non-OK response, a missing body, or any error raised while reading or parsing.
+  const userStore = useUserStore();
+  const baseUrl = (import.meta.env.VITE_BASE_URL || '/api/v1').replace(/\/$/, '');
+  const headers: Record<string, string> = { Accept: 'text/event-stream' };
+  if (userStore.token) headers.Authorization = `Bearer ${userStore.token}`;
+  const response = await fetch(`${baseUrl}/agent/jobs/${encodeURIComponent(jobId)}/events`, {
+    method: 'GET',
+    headers,
+    credentials: 'include',
+    signal,
+  });
+  if (!response.ok) throw new Error(`Agent event stream failed: ${response.status}`);
+  if (!response.body) throw new Error('Agent event stream is not readable');
+  const parser = createAgentSseParser((event) => handlers.onEvent?.(event));
+  const reader = response.body.getReader();
+  const decoder = new TextDecoder();
+  try {
+    while (true) {
+      const { value, done } = await reader.read();
+      if (done) break;
+      parser.feed(decoder.decode(value, { stream: true }));
+    }
+    parser.feed(decoder.decode());
+    parser.flush();
+  } finally {
+    // Best-effort close on every exit path so a parse/handler error does not leave the request open.
+    await reader.cancel().catch(() => undefined);
+  }
+};
diff --git a/web/src/api/user.ts b/web/src/api/user.ts
index 4c02748..13256ea 100644
--- a/web/src/api/user.ts
+++ b/web/src/api/user.ts
@@ -13,7 +13,9 @@ import type {
     StorageStats, 
     ActivityLog,
     GetActivityLogRequest,
-    User
+    User,
+    AdminUserItem,
+    GetAdminUsersParams,
 } from '../types/user';
 import type { PaginatedData } from '../types/base';
 
@@ -144,14 +146,8 @@ export const getUsers = (params: { search?: string; page?: number; perPage?: num
   return http.get<PaginatedData<User>>('/users', params);
 };
 
-export const getAdminUsers = (params: {
-  page?: number;
-  perPage?: number;
-  search?: string;
-  status?: 'active' | 'suspended';
-  role?: 'user' | 'admin';
-}) => {
-  return http.get<PaginatedData<any>>('/admin/users', params);
+export const getAdminUsers = (params: GetAdminUsersParams) => {
+  return http.get<PaginatedData<AdminUserItem>>('/admin/users', params);
 };
 
 export const updateUserStatus = (userId: string, status: 'active' | 'suspended') => {
diff --git a/web/src/components/organisms/agent/AskPrompt.vue b/web/src/components/organisms/agent/AskPrompt.vue
new file mode 100644
index 0000000..ced92ae
--- /dev/null
+++ b/web/src/components/organisms/agent/AskPrompt.vue
@@ -0,0 +1,164 @@
+<script setup lang="ts">
+import { computed, ref } from 'vue';
+import Button from '../../molecules/Button.vue';
+import { useLocaleStore } from '../../../store/locale';
+import { useAskTimeout } from '../../../composables/useAskTimeout';
+import type { PendingAsk } from '../../../composables/useAgentSession';
+
+const props = defineProps<{
+  ask: PendingAsk;
+  disabled?: boolean;
+}>();
+
+const emit = defineEmits<{ reply: [value: unknown] }>();
+
+const localeStore = useLocaleStore();
+const t = localeStore.t;
+
+const askedAt = computed(() => props.ask.askedAt);
+const timeoutSec = computed(() => props.ask.timeoutSec);
+const { formatted, expired } = useAskTimeout(askedAt, timeoutSec);
+
+const text = ref('');
+
+const choices = computed<string[]>(() => {
+  const choice = props.ask.schema?.choice;
+  return Array.isArray(choice) ? choice.map((value) => String(value)) : [];
+});
+
+const timeoutLabel = computed(() =>
+  t('agent.v2.turn.ask.timeout').replace('{value}', formatted.value),
+);
+
+const submit = () => {
+  // Emit the trimmed free-text answer and clear the box; no-op when disabled, expired or blank.
+  const trimmed = text.value.trim();
+  if (props.disabled || expired.value || !trimmed) return;
+  emit('reply', trimmed);
+  text.value = '';
+};
+
+const onInput = (event: Event) => {
+  text.value = (event.target as HTMLTextAreaElement).value;
+};
+
+const onKey = (event: KeyboardEvent) => {
+  // Enter submits and Shift+Enter is left alone; Enter pressed during IME composition is ignored.
+  if (event.key !== 'Enter' || event.shiftKey || event.isComposing) return;
+  event.preventDefault();
+  submit();
+};
+</script>
+
+<template>
+  <section class="ff-askp" :class="{ 'is-expired': expired }">
+    <header class="ff-askp__head">
+      <span class="ff-askp__label">{{ t('agent.v2.turn.status.waiting_for_user') }}</span>
+      <span class="ff-askp__timer">{{ timeoutLabel }}</span>
+    </header>
+    <p class="ff-askp__prompt">{{ ask.prompt }}</p>
+
+    <div v-if="choices.length" class="ff-askp__choices">
+      <Button
+        v-for="choice in choices"
+        :key="choice"
+        variant="ghost"
+        size="sm"
+        :disabled="disabled || expired"
+        @click="emit('reply', choice)"
+      >
+        {{ choice }}
+      </Button>
+    </div>
+
+    <div v-else class="ff-askp__free">
+      <textarea
+        class="ff-askp__ta"
+        :value="text"
+        :disabled="disabled || expired"
+        :placeholder="t('agent.v2.turn.ask.placeholder')"
+        rows="2"
+        @input="onInput"
+        @keydown="onKey"
+      />
+      <Button
+        variant="primary"
+        size="sm"
+        :disabled="!text.trim() || disabled || expired"
+        @click="submit"
+      >
+        {{ t('agent.v2.turn.ask.send') }}
+      </Button>
+    </div>
+  </section>
+</template>
+
+<style scoped>
+.ff-askp {
+  display: flex;
+  flex-direction: column;
+  gap: var(--sp-sm);
+  padding: var(--sp-md);
+  border: 1px solid var(--ac);
+  background: var(--surface-base);
+}
+.ff-askp.is-expired {
+  border-color: var(--text-tertiary);
+  opacity: 0.6;
+}
+.ff-askp__head {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  gap: var(--sp-md);
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+  letter-spacing: var(--tracking-wide);
+  text-transform: uppercase;
+}
+.ff-askp__label { color: var(--ac); }
+.ff-askp__timer {
+  color: var(--text-tertiary);
+  white-space: nowrap;
+}
+.ff-askp__prompt {
+  margin: 0;
+  color: var(--text-primary);
+  white-space: pre-wrap;
+}
+.ff-askp__choices {
+  display: flex;
+  gap: var(--sp-sm);
+  flex-wrap: wrap;
+}
+.ff-askp__free {
+  display: flex;
+  gap: var(--sp-sm);
+  align-items: flex-end;
+}
+.ff-askp__ta {
+  flex: 1;
+  resize: vertical;
+  min-height: 48px;
+  padding: var(--sp-sm) var(--sp-md);
+  background: var(--surface-raised);
+  color: var(--text-primary);
+  border: 1px solid var(--border-default);
+  border-radius: 0;
+  font-family: var(--font-sans);
+  font-size: var(--text-body);
+  outline: none;
+}
+.ff-askp__ta:focus { border-color: var(--ac); }
+.ff-askp__ta:disabled {
+  opacity: 0.6;
+  cursor: not-allowed;
+}
+
+@media (max-width: 720px) {
+  .ff-askp__free {
+    flex-direction: column;
+    align-items: stretch;
+  }
+}
+</style>
diff --git a/web/src/components/organisms/agent/ControlBar.vue b/web/src/components/organisms/agent/ControlBar.vue
new file mode 100644
index 0000000..46836c8
--- /dev/null
+++ b/web/src/components/organisms/agent/ControlBar.vue
@@ -0,0 +1,85 @@
+<script setup lang="ts">
+import Button from '../../molecules/Button.vue';
+import { useLocaleStore } from '../../../store/locale';
+import type { MsgStatus } from '../../../composables/useAgentSession';
+
+defineProps<{
+  status: MsgStatus;
+  hasPlanRiskStep?: boolean;
+}>();
+
+defineEmits<{
+  pause: [];
+  resume: [];
+  skip: [];
+  approve: [];
+  deny: [];
+  cancel: [];
+}>();
+
+const localeStore = useLocaleStore();
+const t = localeStore.t;
+</script>
+
+<template>
+  <div class="ff-ctrl">
+    <Button
+      v-if="status === 'running'"
+      variant="ghost"
+      size="sm"
+      @click.stop="$emit('pause')"
+    >
+      {{ t('agent.v2.turn.controls.pause') }}
+    </Button>
+
+    <Button
+      v-if="status === 'paused'"
+      variant="primary"
+      size="sm"
+      @click.stop="$emit('resume')"
+    >
+      {{ t('agent.v2.turn.controls.resume') }}
+    </Button>
+
+    <Button
+      v-if="status === 'running' || status === 'paused'"
+      variant="ghost"
+      size="sm"
+      @click.stop="$emit('skip')"
+    >
+      {{ t('agent.v2.turn.controls.skip') }}
+    </Button>
+
+    <template v-if="hasPlanRiskStep && status === 'running'">
+      <Button variant="primary" size="sm" @click.stop="$emit('approve')">
+        {{ t('agent.v2.turn.controls.approve') }}
+      </Button>
+      <Button variant="ghost" size="sm" @click.stop="$emit('deny')">
+        {{ t('agent.v2.turn.controls.deny') }}
+      </Button>
+    </template>
+
+    <Button
+      v-if="
+        status === 'pending' ||
+        status === 'running' ||
+        status === 'paused' ||
+        status === 'waiting_for_user'
+      "
+      variant="ghost"
+      size="sm"
+      @click.stop="$emit('cancel')"
+    >
+      {{ t('agent.v2.turn.cancel') }}
+    </Button>
+  </div>
+</template>
+
+<style scoped>
+.ff-ctrl {
+  display: flex;
+  gap: var(--sp-sm);
+  justify-content: flex-end;
+  flex-wrap: wrap;
+}
+</style>
diff --git a/web/src/components/organisms/agent/TaskTimeline.vue b/web/src/components/organisms/agent/TaskTimeline.vue
index 912febe..94297f8 100644
--- a/web/src/components/organisms/agent/TaskTimeline.vue
+++ b/web/src/components/organisms/agent/TaskTimeline.vue
@@ -14,6 +14,12 @@ const props = defineProps<{
 defineEmits<{
   execute: [id: string];
   cancel: [id: string];
+  reply: [id: string, value: unknown];
+  pause: [id: string];
+  resume: [id: string];
+  skip: [id: string];
+  approve: [id: string];
+  deny: [id: string];
   'focus-turn': [id: string];
   'hint-pick': [text: string];
 }>();
@@ -63,6 +69,12 @@ watch(
       :focused="turn.agent.id === focusedId"
       @execute="$emit('execute', turn.agent.id)"
       @cancel="$emit('cancel', turn.agent.id)"
+      @reply="(value) => $emit('reply', turn.agent.id, value)"
+      @pause="$emit('pause', turn.agent.id)"
+      @resume="$emit('resume', turn.agent.id)"
+      @skip="$emit('skip', turn.agent.id)"
+      @approve="$emit('approve', turn.agent.id)"
+      @deny="$emit('deny', turn.agent.id)"
       @focus="$emit('focus-turn', turn.agent.id)"
     />
   </div>
diff --git a/web/src/components/organisms/agent/TurnEntry.spec.ts b/web/src/components/organisms/agent/TurnEntry.spec.ts
index bd18def..9f6684d 100644
--- a/web/src/components/organisms/agent/TurnEntry.spec.ts
+++ b/web/src/components/organisms/agent/TurnEntry.spec.ts
@@ -9,6 +9,7 @@ const baseTurn = (overrides: Partial<AgentTurn['agent']> = {}): AgentTurn => ({
     role: 'user',
     content: 'do it',
     status: 'succeeded',
+    events: [],
     timestamp: '2026-05-20T00:00:00Z',
   },
   agent: {
@@ -16,6 +17,7 @@ const baseTurn = (overrides: Partial<AgentTurn['agent']> = {}): AgentTurn => ({
     role: 'agent',
     content: '',
     status: 'succeeded',
+    events: [],
     timestamp: '2026-05-20T00:00:00Z',
     planHash: 'hash-1',
     planResult: {
@@ -39,6 +41,37 @@ describe('organisms/agent/TurnEntry', () => {
     expect(w.text()).toContain('plan summary text');
   });
 
+  it('renders planning evidence beneath summary', () => {
+    const w = mount(TurnEntry, {
+      props: {
+        turn: baseTurn({
+          planResult: {
+            planJobId: 'p-1',
+            planHash: 'hash-1',
+            chosenSkill: null,
+            proposedActions: [],
+            summary: 'plan summary text',
+            requiresConfirmation: false,
+            costEstimate: { tokens: 100, toolCalls: 2, durationSecEstimate: 5 },
+            planningEvidence: [
+              {
+                step: 1,
+                tool: 'drive.searchFiles',
+                input: { folderId: 'root', query: '银翼杀手', category: 'video' },
+                outputPreview: { totalItems: 2 },
+              },
+            ],
+          },
+        }),
+        policy: 'confirm',
+        focused: false,
+      },
+    });
+    expect(w.text()).toContain('规划依据');
+    expect(w.text()).toContain('drive.searchFiles');
+    expect(w.text()).toContain('银翼杀手');
+  });
+
   it('renders execution answer before the plan summary', () => {
     const w = mount(TurnEntry, {
       props: {
@@ -62,6 +95,43 @@ describe('organisms/agent/TurnEntry', () => {
     expect(w.text()).not.toContain('plan summary text');
   });
 
+  it('renders lightweight agent activity events before the answer', () => {
+    const w = mount(TurnEntry, {
+      props: {
+        turn: baseTurn({
+          events: [
+            {
+              id: 'ev-1',
+              jobId: 'e-1',
+              taskType: 'agent.execute',
+              type: 'tool.started',
+              status: 'running',
+              agentPhase: 'executing',
+              message: '正在读取名称包含“银翼杀手”的视频文件数量。',
+              data: {},
+              timestamp: '2026-05-20T00:00:01Z',
+            },
+          ],
+          executeResult: {
+            planJobId: 'p-1',
+            executeJobId: 'e-1',
+            summary: 'execution summary text',
+            answer: '你上传了 2 部名称包含“银翼杀手”的电影（按视频文件统计）。',
+            appliedActions: 1,
+            skippedActions: 0,
+            warnings: [],
+            finishedAt: '2026-05-20T00:01:00Z',
+          },
+        }),
+        policy: 'confirm',
+        focused: false,
+      },
+    });
+
+    expect(w.text()).toContain('正在读取名称包含');
+    expect(w.text()).toContain('你上传了 2 部名称包含');
+  });
+
   it('hides Execute button when policy=planOnly', () => {
     const w = mount(TurnEntry, {
       props: { turn: baseTurn(), policy: 'planOnly', focused: false },
diff --git a/web/src/components/organisms/agent/TurnEntry.vue b/web/src/components/organisms/agent/TurnEntry.vue
index 0173611..ea4fbaa 100644
--- a/web/src/components/organisms/agent/TurnEntry.vue
+++ b/web/src/components/organisms/agent/TurnEntry.vue
@@ -1,11 +1,13 @@
 <script setup lang="ts">
-import { computed } from 'vue';
+import { computed, ref } from 'vue';
 import Button from '../../molecules/Button.vue';
 import MonoNumber from '../../atoms/MonoNumber.vue';
 import PlanActionRow from './PlanActionRow.vue';
+import AskPrompt from './AskPrompt.vue';
+import ControlBar from './ControlBar.vue';
 import { useLocaleStore } from '../../../store/locale';
 import type { LocaleKey } from '../../../i18n/messages';
-import type { AgentExecutionPolicy } from '../../../types/agent';
+import type { AgentExecutionPolicy, AgentPlanningEvidence } from '../../../types/agent';
 import type { AgentTurn } from '../../../composables/useAgentSession';
 
 const props = defineProps<{
@@ -14,7 +16,17 @@ const props = defineProps<{
   focused: boolean;
 }>();
 
-defineEmits<{ execute: []; cancel: []; focus: [] }>();
+defineEmits<{
+  execute: [];
+  cancel: [];
+  focus: [];
+  reply: [value: unknown];
+  pause: [];
+  resume: [];
+  skip: [];
+  approve: [];
+  deny: [];
+}>();
 
 const localeStore = useLocaleStore();
 const t = localeStore.t;
@@ -28,18 +40,61 @@ const canExecute = computed(
 );
 
 const isActive = computed(
-  () => props.turn.agent.status === 'pending' || props.turn.agent.status === 'running',
+  () =>
+    props.turn.agent.status === 'pending' ||
+    props.turn.agent.status === 'running' ||
+    props.turn.agent.status === 'paused' ||
+    props.turn.agent.status === 'waiting_for_user',
 );
 
 const resultText = computed(
   () => props.turn.agent.executeResult?.answer || props.turn.agent.executeResult?.summary || '',
 );
 
+const activityEvents = computed(() => {
+  // Keep at most the four latest events that carry a message and are not of an excluded type.
+  const excluded = [
+    'job.succeeded',
+    'agent.thinking',
+    'agent.progress',
+    'tool.partial',
+  ];
+  const all = props.turn.agent.events || [];
+  const shown = all.filter((event) => event.message && !excluded.includes(event.type));
+  return shown.slice(-4);
+});
+
+const hasPlanRiskStep = computed(() =>
+  Boolean(
+    props.turn.agent.planResult?.proposedActions?.some(
+      (action) => action.riskLevel === 'high' || action.requiresConfirmation,
+    ),
+  ),
+);
+
+const thinkingExpanded = ref(false);
+
 const statusLabel = computed(() => {
   const key = `agent.v2.turn.status.${props.turn.agent.status}` as LocaleKey;
   return t(key);
 });
 
+const planningEvidence = computed(
+  () => props.turn.agent.planResult?.planningEvidence?.filter(Boolean) ?? [],
+);
+const visibleEvidence = computed(() => planningEvidence.value.slice(0, 3));
+const hiddenEvidence = computed(() => planningEvidence.value.slice(3));
+
+const formatEvidencePreview = (evidence: AgentPlanningEvidence) => {
+  // Pretty-print the step's input and output preview as 2-space JSON, using {} for missing parts.
+  const preview = {
+    input: evidence.input || {},
+    outputPreview: evidence.outputPreview || {},
+  };
+  const indent = 2;
+  return JSON.stringify(preview, null, indent);
+};
+
 const formatTime = (iso: string) => {
   try {
     return new Date(iso).toLocaleTimeString([], { hour: '2-digit', minute: '2-digit' });
@@ -69,7 +124,42 @@ const formatTime = (iso: string) => {
           }}</span>
         </header>
 
-        <div v-if="isActive" class="ff-te__progress" />
+        <div v-if="turn.agent.status === 'running' || turn.agent.status === 'paused'" class="ff-te__progress" />
+
+        <div v-if="turn.agent.progress" class="ff-te__progress-meta">
+          <span class="ff-te__progress-label">{{ t('agent.v2.turn.progress.label') }}</span>
+          <span class="ff-te__progress-num">
+            <MonoNumber :value="`${turn.agent.progress.step}/${turn.agent.progress.total}`" />
+          </span>
+          <span v-if="turn.agent.progress.message" class="ff-te__progress-msg">
+            {{ turn.agent.progress.message }}
+          </span>
+        </div>
+
+        <details
+          v-if="turn.agent.thinking"
+          class="ff-te__thinking"
+          :open="thinkingExpanded"
+          @toggle="(event) => (thinkingExpanded = (event.target as HTMLDetailsElement).open)"
+        >
+          <summary :title="t('agent.v2.turn.thinking.toggle')">
+            {{ t('agent.v2.turn.thinking.label') }}
+          </summary>
+          <pre class="ff-te__thinking-body">{{ turn.agent.thinking }}</pre>
+        </details>
+
+        <ol v-if="activityEvents.length" class="ff-te__events">
+          <li v-for="event in activityEvents" :key="event.id" class="ff-te__event">
+            <span class="ff-te__event-dot" />
+            <span>{{ event.message }}</span>
+          </li>
+        </ol>
+
+        <AskPrompt
+          v-if="turn.agent.pendingAsk"
+          :ask="turn.agent.pendingAsk"
+          @reply="(value) => $emit('reply', value)"
+        />
 
         <p v-if="resultText" class="ff-te__sum ff-te__answer">
           {{ resultText }}
@@ -79,6 +169,29 @@ const formatTime = (iso: string) => {
           {{ turn.agent.planResult.summary }}
         </p>
 
+        <section v-if="planningEvidence.length" class="ff-te__evidence">
+          <p class="ff-te__evidence-label">{{ t('agent.v2.turn.evidence.label') }}</p>
+          <ol class="ff-te__evidence-list">
+            <li v-for="item in visibleEvidence" :key="`evidence-${item.step}-${item.tool}`" class="ff-te__evidence-item">
+              <span class="ff-te__evidence-head">#{{ item.step }} · {{ item.tool }}</span>
+              <pre class="ff-te__evidence-json">{{ formatEvidencePreview(item) }}</pre>
+            </li>
+          </ol>
+          <details v-if="hiddenEvidence.length" class="ff-te__evidence-more">
+            <summary>+{{ hiddenEvidence.length }} {{ t('agent.v2.turn.evidence.more') }}</summary>
+            <ol class="ff-te__evidence-list">
+              <li
+                v-for="item in hiddenEvidence"
+                :key="`evidence-hidden-${item.step}-${item.tool}`"
+                class="ff-te__evidence-item"
+              >
+                <span class="ff-te__evidence-head">#{{ item.step }} · {{ item.tool }}</span>
+                <pre class="ff-te__evidence-json">{{ formatEvidencePreview(item) }}</pre>
+              </li>
+            </ol>
+          </details>
+        </section>
+
         <section v-if="!resultText && turn.agent.planResult?.proposedActions?.length" class="ff-te__actions">
           <PlanActionRow
             v-for="a in turn.agent.planResult.proposedActions"
@@ -116,12 +229,17 @@ const formatTime = (iso: string) => {
             size="sm"
             @click.stop="$emit('execute')"
           >{{ t('agent.v2.turn.execute') }}</Button>
-          <Button
+          <ControlBar
             v-if="isActive"
-            variant="ghost"
-            size="sm"
-            @click.stop="$emit('cancel')"
-          >{{ t('agent.v2.turn.cancel') }}</Button>
+            :status="turn.agent.status"
+            :has-plan-risk-step="hasPlanRiskStep"
+            @pause="$emit('pause')"
+            @resume="$emit('resume')"
+            @skip="$emit('skip')"
+            @approve="$emit('approve')"
+            @deny="$emit('deny')"
+            @cancel="$emit('cancel')"
+          />
         </div>
       </div>
     </div>
@@ -176,6 +294,8 @@ const formatTime = (iso: string) => {
 .ff-te__status--succeeded { color: var(--status-success); }
 .ff-te__status--failed { color: var(--status-error); }
 .ff-te__status--canceled { color: var(--text-tertiary); }
+.ff-te__status--waiting_for_user { color: var(--ac); }
+.ff-te__status--paused { color: var(--status-warning); }
 
 .ff-te__progress {
   height: 2px;
@@ -188,9 +308,115 @@ const formatTime = (iso: string) => {
   100% { background-position: -200% 0; }
 }
 
+.ff-te__progress-meta {
+  display: flex;
+  gap: var(--sp-md);
+  align-items: baseline;
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+  letter-spacing: var(--tracking-wide);
+  text-transform: uppercase;
+  color: var(--text-tertiary);
+}
+.ff-te__progress-label { color: var(--text-tertiary); }
+.ff-te__progress-num { color: var(--text-secondary); }
+.ff-te__progress-msg {
+  color: var(--text-secondary);
+  text-transform: none;
+  letter-spacing: 0;
+}
+
+.ff-te__thinking {
+  border: 1px dashed var(--border-default);
+  padding: var(--sp-sm) var(--sp-md);
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+}
+.ff-te__thinking summary {
+  cursor: pointer;
+  color: var(--text-tertiary);
+  letter-spacing: var(--tracking-wide);
+  text-transform: uppercase;
+}
+.ff-te__thinking-body {
+  margin: var(--sp-sm) 0 0;
+  white-space: pre-wrap;
+  color: var(--text-secondary);
+  max-height: 240px;
+  overflow: auto;
+}
+
 .ff-te__sum { margin: 0; color: var(--text-primary); }
 .ff-te__answer { white-space: pre-wrap; }
 
+.ff-te__events {
+  display: flex;
+  flex-direction: column;
+  gap: 4px;
+  margin: 0;
+  padding: 0;
+  list-style: none;
+}
+.ff-te__event {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  min-height: 18px;
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+  color: var(--text-tertiary);
+}
+.ff-te__event-dot {
+  width: 5px;
+  height: 5px;
+  background: var(--ac);
+  flex: 0 0 auto;
+}
+
+.ff-te__evidence {
+  display: grid;
+  gap: var(--sp-xs);
+}
+.ff-te__evidence-label {
+  margin: 0;
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+  color: var(--text-tertiary);
+  letter-spacing: var(--tracking-wide);
+  text-transform: uppercase;
+}
+.ff-te__evidence-list {
+  margin: 0;
+  padding-left: 18px;
+  display: grid;
+  gap: var(--sp-xs);
+}
+.ff-te__evidence-item {
+  display: grid;
+  gap: 4px;
+}
+.ff-te__evidence-head {
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+  color: var(--text-secondary);
+}
+.ff-te__evidence-json {
+  margin: 0;
+  padding: var(--sp-xs);
+  border: 1px solid var(--border-subtle);
+  background: var(--surface-inset);
+  color: var(--text-secondary);
+  font-size: 12px;
+  white-space: pre-wrap;
+  word-break: break-word;
+}
+.ff-te__evidence-more summary {
+  cursor: pointer;
+  color: var(--text-tertiary);
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+}
+
 .ff-te__actions {
   border: 1px solid var(--border-subtle);
   border-bottom: 0;
diff --git a/web/src/components/organisms/agent/index.ts b/web/src/components/organisms/agent/index.ts
index 16d4510..67d4d58 100644
--- a/web/src/components/organisms/agent/index.ts
+++ b/web/src/components/organisms/agent/index.ts
@@ -1,6 +1,8 @@
 export { default as SessionItem } from './SessionItem.vue';
 export { default as SessionList } from './SessionList.vue';
 export { default as PlanActionRow } from './PlanActionRow.vue';
+export { default as AskPrompt } from './AskPrompt.vue';
+export { default as ControlBar } from './ControlBar.vue';
 export { default as TurnEntry } from './TurnEntry.vue';
 export { default as TaskTimeline } from './TaskTimeline.vue';
 export { default as TaskInputDock } from './TaskInputDock.vue';
diff --git a/web/src/composables/useAgentSession.spec.ts b/web/src/composables/useAgentSession.spec.ts
index ef1b101..e505c53 100644
--- a/web/src/composables/useAgentSession.spec.ts
+++ b/web/src/composables/useAgentSession.spec.ts
@@ -1,11 +1,20 @@
 import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
 import { nextTick } from 'vue';
+import type { ChatMessage } from './useAgentSession';
 
 vi.mock('../api/agent', () => ({
   planAgentTask: vi.fn(),
   executeAgentPlan: vi.fn(),
-  cancelAgentJob: vi.fn(),
+  cancelAgentTurn: vi.fn(),
   getAgentJob: vi.fn(),
+  streamAgentJobEvents: vi.fn(),
+  sendAgentMessage: vi.fn(),
+  sendAgentReply: vi.fn(),
+  pauseAgentJob: vi.fn(),
+  resumeAgentJob: vi.fn(),
+  approveAgentStep: vi.fn(),
+  denyAgentStep: vi.fn(),
+  skipAgentStep: vi.fn(),
 }));
 
 vi.mock('../store/user', () => ({
@@ -46,6 +55,24 @@ const readOnlyPlanResult = {
   requiresConfirmation: true,
 };
 
+const readOnlyPlanResultWithEvidence = {
+  ...readOnlyPlanResult,
+  planningEvidence: [
+    {
+      step: 1,
+      tool: 'drive.searchFiles',
+      input: { folderId: 'root', query: '银翼杀手', category: 'video' },
+      outputPreview: {
+        totalItems: 2,
+        items: [
+          { fileId: '19', name: '银翼杀手1982.mp4' },
+          { fileId: '20', name: '银翼杀手2049.mp4' },
+        ],
+      },
+    },
+  ],
+};
+
 const writePlanResult = {
   ...planResult,
   proposedActions: [
@@ -93,6 +120,7 @@ describe('useAgentSession', () => {
     vi.clearAllMocks();
     localStorage.clear();
     vi.useFakeTimers();
+    vi.mocked(agentApi.streamAgentJobEvents).mockRejectedValue(new Error('stream unavailable'));
   });
 
   afterEach(async () => {
@@ -291,6 +319,81 @@ describe('useAgentSession', () => {
     expect(turn.agent.status).toBe('succeeded');
   });
 
+  it('uses streamed plan and execute events when available', async () => {
+    vi.mocked(agentApi.planAgentTask).mockResolvedValue({
+      jobId: 'job-1',
+      status: 'pending',
+      taskType: 'agent.plan',
+    });
+    vi.mocked(agentApi.executeAgentPlan).mockResolvedValue({
+      jobId: 'job-2',
+      status: 'pending',
+      taskType: 'agent.execute',
+    });
+    vi.mocked(agentApi.streamAgentJobEvents)
+      .mockImplementationOnce(async (_jobId, handlers) => {
+        handlers?.onEvent?.({
+          id: 'plan-ready-1',
+          jobId: 'job-1',
+          taskType: 'agent.plan',
+          type: 'plan.ready',
+          status: 'succeeded',
+          agentPhase: 'completed',
+          message: '计划已生成。',
+          data: { result: readOnlyPlanResultWithEvidence },
+          timestamp: '2026-05-20T00:00:00Z',
+        });
+        handlers?.onEvent?.({
+          id: 'plan-done-1',
+          jobId: 'job-1',
+          taskType: 'agent.plan',
+          type: 'job.succeeded',
+          status: 'succeeded',
+          agentPhase: 'completed',
+          message: '任务已完成。',
+          data: { result: readOnlyPlanResultWithEvidence },
+          timestamp: '2026-05-20T00:00:01Z',
+        });
+      })
+      .mockImplementationOnce(async (_jobId, handlers) => {
+        handlers?.onEvent?.({
+          id: 'tool-start-1',
+          jobId: 'job-2',
+          taskType: 'agent.execute',
+          type: 'tool.started',
+          status: 'running',
+          agentPhase: 'executing',
+          message: '正在读取名称包含“银翼杀手”的视频文件数量。',
+          data: { step: 1, tool: 'drive.countFiles' },
+          timestamp: '2026-05-20T00:00:02Z',
+        });
+        handlers?.onEvent?.({
+          id: 'execute-done-1',
+          jobId: 'job-2',
+          taskType: 'agent.execute',
+          type: 'job.succeeded',
+          status: 'succeeded',
+          agentPhase: 'completed',
+          message: '答案已生成。',
+          data: { result: execResult },
+          timestamp: '2026-05-20T00:00:03Z',
+        });
+      });
+    // First stream mock serves the plan job, second one serves the execute job.
+    const { default: useAgentSession } = await loadComposable();
+    const { taskInput, sendMessage, activeTurns } = useAgentSession();
+    taskInput.value = '我上传了几部银翼杀手？';
+    await sendMessage();
+    // The streamed events alone must finish the turn: getAgentJob is never called.
+    const turn = activeTurns.value[0];
+    expect(agentApi.getAgentJob).not.toHaveBeenCalled();
+    expect(agentApi.executeAgentPlan).toHaveBeenCalled();
+    expect(turn.agent.events.map((event) => event.id)).toContain('tool-start-1');
+    expect(turn.agent.planResult?.planningEvidence?.[0]?.tool).toBe('drive.searchFiles');
+    expect(turn.agent.executeResult?.answer).toContain('3 部电影');
+    expect(turn.agent.status).toBe('succeeded');
+  });
+
   it('does not auto-execute write plans in confirm policy', async () => {
     vi.mocked(agentApi.planAgentTask).mockResolvedValue({
       jobId: 'job-1',
@@ -415,7 +518,7 @@ describe('useAgentSession', () => {
     expect(turn.agent.errorMessage).toBe('Execute failed.');
   });
 
-  it('cancel calls cancelAgentJob and clears polling for that turn', async () => {
+  it('cancel calls cancelAgentTurn and clears polling for that turn', async () => {
     vi.mocked(agentApi.planAgentTask).mockResolvedValue({
       jobId: 'job-1',
       status: 'pending',
@@ -426,10 +529,10 @@ describe('useAgentSession', () => {
       jobId: 'job-1',
       status: 'running',
     } as any);
-    vi.mocked(agentApi.cancelAgentJob).mockResolvedValue({
-      jobId: 'job-1',
-      status: 'canceled',
-      canceledAt: '2026-05-20T00:00:00Z',
+    vi.mocked(agentApi.cancelAgentTurn).mockResolvedValue({
+      inboxMessageId: 'inbox-1',
+      kind: 'control.cancel',
+      acceptedAt: '2026-05-20T00:00:00Z',
     });
 
     const { default: useAgentSession } = await loadComposable();
@@ -440,7 +543,7 @@ describe('useAgentSession', () => {
     const turn = activeTurns.value[0];
     const callsBefore = vi.mocked(agentApi.getAgentJob).mock.calls.length;
     await cancel(turn.agent);
-    expect(agentApi.cancelAgentJob).toHaveBeenCalled();
+    expect(agentApi.cancelAgentTurn).toHaveBeenCalled();
     // Advance time to ensure timer wouldn't fire again
     await vi.advanceTimersByTimeAsync(3000);
     const callsAfter = vi.mocked(agentApi.getAgentJob).mock.calls.length;
@@ -450,10 +553,10 @@ describe('useAgentSession', () => {
   it('cancel before plan job id arrives keeps turn canceled and does not start polling', async () => {
     const planGate = deferred<any>();
     vi.mocked(agentApi.planAgentTask).mockReturnValue(planGate.promise);
-    vi.mocked(agentApi.cancelAgentJob).mockResolvedValue({
-      jobId: 'job-late',
-      status: 'canceled',
-      canceledAt: '2026-05-20T00:00:00Z',
+    vi.mocked(agentApi.cancelAgentTurn).mockResolvedValue({
+      inboxMessageId: 'inbox-late',
+      kind: 'control.cancel',
+      acceptedAt: '2026-05-20T00:00:00Z',
     });
 
     const { default: useAgentSession } = await loadComposable();
@@ -474,7 +577,7 @@ describe('useAgentSession', () => {
     await sendTask;
 
     expect(agentApi.getAgentJob).not.toHaveBeenCalled();
-    expect(agentApi.cancelAgentJob).toHaveBeenCalledWith('job-late');
+    expect(agentApi.cancelAgentTurn).toHaveBeenCalledWith('job-late');
     expect(turn.agent.status).toBe('canceled');
   });
 
@@ -486,10 +589,10 @@ describe('useAgentSession', () => {
       taskType: 'agent.plan',
     });
     vi.mocked(agentApi.getAgentJob).mockReturnValue(firstPoll.promise);
-    vi.mocked(agentApi.cancelAgentJob).mockResolvedValue({
-      jobId: 'job-1',
-      status: 'canceled',
-      canceledAt: '2026-05-20T00:00:00Z',
+    vi.mocked(agentApi.cancelAgentTurn).mockResolvedValue({
+      inboxMessageId: 'inbox-1',
+      kind: 'control.cancel',
+      acceptedAt: '2026-05-20T00:00:00Z',
     });
 
     const { default: useAgentSession } = await loadComposable();
@@ -497,8 +600,9 @@ describe('useAgentSession', () => {
     taskInput.value = 'hello';
 
     const sendTask = sendMessage();
-    await Promise.resolve();
-    await Promise.resolve();
+    for (let i = 0; i < 6 && vi.mocked(agentApi.getAgentJob).mock.calls.length === 0; i += 1) {
+      await Promise.resolve();
+    }
     const turn = activeTurns.value[0];
     await cancel(turn.agent);
     expect(turn.agent.status).toBe('canceled');
@@ -514,6 +618,208 @@ describe('useAgentSession', () => {
     expect(vi.mocked(agentApi.getAgentJob).mock.calls.length).toBe(1);
   });
 
+  it('applies ask, progress, thinking, pause, resume, and partial stream events', async () => {
+    vi.mocked(agentApi.planAgentTask).mockResolvedValue({
+      jobId: 'job-ask',
+      status: 'pending',
+      taskType: 'agent.plan',
+    });
+    vi.mocked(agentApi.streamAgentJobEvents).mockImplementationOnce(async (_jobId, handlers) => {
+      handlers?.onEvent?.({
+        id: 'progress-1',
+        jobId: 'job-ask',
+        taskType: 'agent.plan',
+        type: 'agent.progress',
+        status: 'running',
+        agentPhase: 'planning',
+        message: 'step one',
+        data: { step: 1, total: 3, message: 'Reading folders', percent: 33 },
+        timestamp: '2026-05-26T00:00:00Z',
+      });
+      handlers?.onEvent?.({
+        id: 'thinking-1',
+        jobId: 'job-ask',
+        taskType: 'agent.plan',
+        type: 'agent.thinking',
+        status: 'running',
+        agentPhase: 'planning',
+        message: '',
+        data: { text: 'Need user choice.' },
+        timestamp: '2026-05-26T00:00:01Z',
+      });
+      handlers?.onEvent?.({
+        id: 'partial-1',
+        jobId: 'job-ask',
+        taskType: 'agent.plan',
+        type: 'tool.partial',
+        status: 'running',
+        agentPhase: 'planning',
+        message: '',
+        data: { step: 1, tool: 'drive.listFolder', chunk: { name: 'A' } },
+        timestamp: '2026-05-26T00:00:02Z',
+      });
+      handlers?.onEvent?.({
+        id: 'paused-1',
+        jobId: 'job-ask',
+        taskType: 'agent.plan',
+        type: 'agent.paused',
+        status: 'paused',
+        agentPhase: 'planning',
+        message: 'paused',
+        data: {},
+        timestamp: '2026-05-26T00:00:03Z',
+      });
+      handlers?.onEvent?.({
+        id: 'resumed-1',
+        jobId: 'job-ask',
+        taskType: 'agent.plan',
+        type: 'agent.resumed',
+        status: 'running',
+        agentPhase: 'planning',
+        message: 'resumed',
+        data: {},
+        timestamp: '2026-05-26T00:00:04Z',
+      });
+      handlers?.onEvent?.({
+        id: 'ask-1',
+        jobId: 'job-ask',
+        taskType: 'agent.plan',
+        type: 'agent.ask',
+        status: 'waiting_for_user',
+        agentPhase: 'planning',
+        message: 'choose',
+        data: {
+          messageId: 'ask-101',
+          prompt: 'Pick one',
+          schema: { choice: ['A', 'B'] },
+          timeoutSec: 60,
+        },
+        timestamp: '2026-05-26T00:00:05Z',
+      });
+    });
+    // The mocked stream ends right after the ask event; no terminal job event is sent.
+    const { default: useAgentSession } = await loadComposable();
+    const { taskInput, sendMessage, activeTurns } = useAgentSession();
+    taskInput.value = 'choose a folder';
+    await sendMessage();
+    // Check the state the streamed events left on the agent message.
+    const turn = activeTurns.value[0];
+    expect(turn.agent.status).toBe('waiting_for_user');
+    expect(turn.agent.pendingAsk?.messageId).toBe('ask-101');
+    expect(turn.agent.progress?.step).toBe(1);
+    expect(turn.agent.thinking).toContain('Need user choice.');
+    expect(turn.agent.partials?.[1].chunks).toEqual([{ name: 'A' }]);
+  });
+
+  it('replyToAsk forwards reply via inbox and advances status to running', async () => {
+    vi.mocked(agentApi.sendAgentReply).mockResolvedValue({
+      inboxMessageId: 'reply-1',
+      kind: 'reply',
+      acceptedAt: '2026-05-26T00:00:00Z',
+    });
+    // Hand-build a message that is already waiting on ask '101' of execute job '99'.
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, replyToAsk } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-e2e',
+      role: 'agent',
+      content: '',
+      status: 'waiting_for_user',
+      events: [],
+      timestamp: new Date().toISOString(),
+      executeJobId: '99',
+      pendingAsk: {
+        messageId: '101',
+        prompt: 'pick',
+        schema: { choice: ['A', 'B'] },
+        timeoutSec: 60,
+        askedAt: new Date().toISOString(),
+      },
+    };
+    session.messages.push(msg);
+
+    await replyToAsk(msg, 'A');
+    // The reply carries job id, ask id and value; the ask is cleared locally.
+    expect(agentApi.sendAgentReply).toHaveBeenCalledWith('99', '101', 'A');
+    expect(msg.status).toBe('running');
+    expect(msg.pendingAsk).toBeUndefined();
+  });
+
+  it('pause and resume send control.pause then control.resume', async () => {
+    vi.mocked(agentApi.pauseAgentJob).mockResolvedValue({
+      inboxMessageId: 'pause-1',
+      kind: 'control.pause',
+      acceptedAt: '2026-05-26T00:00:00Z',
+    });
+    vi.mocked(agentApi.resumeAgentJob).mockResolvedValue({
+      inboxMessageId: 'resume-1',
+      kind: 'control.resume',
+      acceptedAt: '2026-05-26T00:00:01Z',
+    });
+    // A running message whose only job id is executeJobId '77'.
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, pauseTurn, resumeTurn } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-pp',
+      role: 'agent',
+      content: '',
+      status: 'running',
+      events: [],
+      timestamp: new Date().toISOString(),
+      executeJobId: '77',
+    };
+    session.messages.push(msg);
+
+    await pauseTurn(msg);
+    expect(agentApi.pauseAgentJob).toHaveBeenCalledWith('77');
+    expect(msg.pauseRequestedAt).toBeTruthy();
+    // Resuming must target the same job id.
+    await resumeTurn(msg);
+    expect(agentApi.resumeAgentJob).toHaveBeenCalledWith('77');
+  });
+
+  it('approve, deny, and skip send inbox control helpers', async () => {
+    vi.mocked(agentApi.approveAgentStep).mockResolvedValue({
+      inboxMessageId: 'approve-1',
+      kind: 'control.approve',
+      acceptedAt: '2026-05-26T00:00:00Z',
+    });
+    vi.mocked(agentApi.denyAgentStep).mockResolvedValue({
+      inboxMessageId: 'deny-1',
+      kind: 'control.deny',
+      acceptedAt: '2026-05-26T00:00:00Z',
+    });
+    vi.mocked(agentApi.skipAgentStep).mockResolvedValue({
+      inboxMessageId: 'skip-1',
+      kind: 'control.skip',
+      acceptedAt: '2026-05-26T00:00:00Z',
+    });
+    // Only planJobId is set on the message, so every control must target job '66'.
+    const { default: useAgentSession } = await loadComposable();
+    const { createSession, approveStep, denyStep, skipStep } = useAgentSession();
+    const session = createSession();
+    const msg: ChatMessage = {
+      id: 'msg-controls',
+      role: 'agent',
+      content: '',
+      status: 'running',
+      events: [],
+      timestamp: new Date().toISOString(),
+      planJobId: '66',
+    };
+    session.messages.push(msg);
+
+    await approveStep(msg);
+    await denyStep(msg);
+    await skipStep(msg);
+
+    expect(agentApi.approveAgentStep).toHaveBeenCalledWith('66');
+    expect(agentApi.denyAgentStep).toHaveBeenCalledWith('66');
+    expect(agentApi.skipAgentStep).toHaveBeenCalledWith('66');
+  });
+
   it('reload — sessions persist via localStorage', async () => {
     const { default: useAgentSession, __resetForTests } = await loadComposable();
     const a = useAgentSession();
diff --git a/web/src/composables/useAgentSession.ts b/web/src/composables/useAgentSession.ts
index a8a14b4..56995ed 100644
--- a/web/src/composables/useAgentSession.ts
+++ b/web/src/composables/useAgentSession.ts
@@ -1,22 +1,55 @@
 import { computed, onScopeDispose, ref, watch, type Ref } from 'vue';
 import {
-  cancelAgentJob,
+  approveAgentStep,
+  cancelAgentTurn,
+  denyAgentStep,
   executeAgentPlan,
   getAgentJob,
+  pauseAgentJob,
   planAgentTask,
+  resumeAgentJob,
+  sendAgentReply,
+  skipAgentStep,
+  streamAgentJobEvents,
 } from '../api/agent';
 import { useUserStore } from '../store/user';
 import { useLocaleStore } from '../store/locale';
 import { ui } from '../utils/ui';
 import type {
+  AgentAskPayload,
   AgentExecutionPolicy,
   AgentExecutionResult,
+  AgentJobEvent,
   AgentPlanResult,
+  AgentProgressPayload,
   AgentReasoningEffort,
+  AgentThinkingPayload,
+  AgentToolPartialPayload,
   PlanAgentRequest,
 } from '../types/agent';
 
-export type MsgStatus = 'pending' | 'running' | 'succeeded' | 'failed' | 'canceled';
+export type MsgStatus =
+  | 'pending'
+  | 'running'
+  | 'succeeded'
+  | 'failed'
+  | 'canceled'
+  | 'waiting_for_user' // set when an 'agent.ask' event is applied
+  | 'paused'; // set when an 'agent.paused' event is applied
+
+export interface PendingAsk {
+  messageId: string; // id of the ask; passed back to sendAgentReply with the answer
+  prompt: string;
+  schema: Record<string, unknown>;
+  timeoutSec: number;
+  askedAt: string; // timestamp of the 'agent.ask' event that created this entry
+}
+
+export interface ToolPartial {
+  step: number; // also the key this entry is stored under in ChatMessage.partials
+  tool: string;
+  chunks: unknown[]; // one element appended per 'tool.partial' event
+}
 
 export interface ChatMessage {
   id: string;
@@ -28,8 +61,14 @@ export interface ChatMessage {
   planResult?: AgentPlanResult;
   executeJobId?: string;
   executeResult?: AgentExecutionResult;
+  events: AgentJobEvent[];
   errorMessage?: string;
   timestamp: string;
+  pendingAsk?: PendingAsk;
+  pauseRequestedAt?: string;
+  progress?: { step: number; total: number; message?: string; percent?: number };
+  thinking?: string;
+  partials?: Record<number, ToolPartial>;
 }
 
 export interface Session {
@@ -92,7 +131,10 @@ const normalizeSessions = (value: unknown): Session[] => {
     const session: Session = {
       id: record.id,
       title: typeof record.title === 'string' ? record.title : 'New session',
-      messages: record.messages as ChatMessage[],
+      messages: (record.messages as ChatMessage[]).map((message) => ({
+        ...message,
+        events: Array.isArray(message.events) ? message.events : [],
+      })),
       createdAt: typeof record.createdAt === 'string' ? record.createdAt : now,
       updatedAt: typeof record.updatedAt === 'string' ? record.updatedAt : now,
     };
@@ -141,6 +183,7 @@ interface SessionState {
   isSending: Ref<boolean>;
   pollGenerations: Map<string, number>;
   pollSleepTimers: Map<string, ReturnType<typeof setTimeout>>;
+  streamControllers: Map<string, AbortController>;
   canceledTurns: Set<string>;
 }
 
@@ -157,6 +200,7 @@ const getState = (): SessionState => {
   const isSending = ref<boolean>(false);
   const pollGenerations = new Map<string, number>();
   const pollSleepTimers = new Map<string, ReturnType<typeof setTimeout>>();
+  const streamControllers = new Map<string, AbortController>();
   const canceledTurns = new Set<string>();
 
   watch(sessions, (v) => persistSessions(v), { deep: true });
@@ -171,6 +215,7 @@ const getState = (): SessionState => {
     isSending,
     pollGenerations,
     pollSleepTimers,
+    streamControllers,
     canceledTurns,
   };
   return _state;
@@ -180,6 +225,8 @@ export const __resetForTests = () => {
   if (_state) {
     _state.pollSleepTimers.forEach((t) => clearTimeout(t));
     _state.pollSleepTimers.clear();
+    _state.streamControllers.forEach((controller) => controller.abort());
+    _state.streamControllers.clear();
     _state.pollGenerations.clear();
     _state.canceledTurns.clear();
   }
@@ -258,9 +305,18 @@ export default function useAgentSession() {
     clearSleepTimer(key);
   };
 
+  // Abort and forget the stream controller registered under `key`, if there is one.
+  const stopStream = (key: string) => {
+    const active = s.streamControllers.get(key);
+    active?.abort();
+    if (active) s.streamControllers.delete(key);
+  };
+
   const stopAllPolling = () => {
     s.pollSleepTimers.forEach((t) => clearTimeout(t));
     s.pollSleepTimers.clear();
+    s.streamControllers.forEach((controller) => controller.abort());
+    s.streamControllers.clear();
     s.pollGenerations.clear();
   };
 
@@ -346,6 +402,8 @@ export default function useAgentSession() {
       clearTurnCanceled(msg);
       stopPolling(`${msg.id}:plan`);
       stopPolling(`${msg.id}:execute`);
+      stopStream(`${msg.id}:plan`);
+      stopStream(`${msg.id}:execute`);
     });
     s.sessions.value.splice(idx, 1);
     if (s.activeSessionId.value === id) {
@@ -362,6 +420,8 @@ export default function useAgentSession() {
       clearTurnCanceled(msg);
       stopPolling(`${msg.id}:plan`);
       stopPolling(`${msg.id}:execute`);
+      stopStream(`${msg.id}:plan`);
+      stopStream(`${msg.id}:execute`);
     });
     stopAllPolling();
     activeSession.value.messages = [];
@@ -371,6 +431,123 @@ export default function useAgentSession() {
 
   const ensureSession = (): Session => activeSession.value ?? createSession();
 
+  // Record an event on the message once; an event whose id is already stored is ignored.
+  const appendAgentEvent = (msg: ChatMessage, event: AgentJobEvent) => {
+    if (!msg.events.some((seen) => seen.id === event.id)) msg.events.push(event);
+  };
+
+  // Fold one job event into the message: log it, update the status, and copy any
+  // ask / pause / progress / thinking / partial / result payload onto it.
+  // `kind` decides whether a `job.succeeded` result is a plan or an execution.
+  const applyAgentEvent = (msg: ChatMessage, event: AgentJobEvent, kind: 'plan' | 'execute') => {
+    appendAgentEvent(msg, event);
+
+    if (event.type === 'job.queued') {
+      msg.status = 'pending';
+    } else if (event.type === 'job.running' || event.type === 'tool.started') {
+      // A "running" signal must not hide a pending ask or a pause.
+      if (msg.status !== 'waiting_for_user' && msg.status !== 'paused') {
+        msg.status = 'running';
+      }
+    } else if (event.type === 'job.failed' || event.type === 'tool.failed') {
+      msg.status = 'failed';
+      const errorMessage = event.data?.errorMessage;
+      msg.errorMessage = typeof errorMessage === 'string' ? errorMessage : event.message;
+    } else if (event.type === 'job.canceled') {
+      msg.status = 'canceled';
+    } else if (event.type === 'job.succeeded') {
+      msg.status = 'succeeded';
+    }
+    // A finished job can no longer be answered or resumed, so drop the stale
+    // ask/pause markers on every terminal job event, not only on success.
+    if (['job.succeeded', 'job.failed', 'job.canceled'].includes(event.type)) {
+      msg.pendingAsk = undefined;
+      msg.pauseRequestedAt = undefined;
+    }
+
+    if (event.type === 'agent.ask') {
+      const { messageId, prompt, schema, timeoutSec } = event.data as AgentAskPayload;
+      msg.pendingAsk = { messageId, prompt, schema, timeoutSec, askedAt: event.timestamp };
+      msg.status = 'waiting_for_user';
+    } else if (event.type === 'agent.paused') {
+      msg.status = 'paused';
+      msg.pauseRequestedAt = event.timestamp;
+    } else if (event.type === 'agent.resumed') {
+      msg.status = 'running';
+      msg.pauseRequestedAt = undefined;
+    } else if (event.type === 'agent.progress') {
+      const { step, total, message, percent } = event.data as AgentProgressPayload;
+      msg.progress = { step, total, message, percent };
+    } else if (event.type === 'agent.thinking') {
+      // Append to whatever thinking text has been collected so far.
+      const payload = event.data as AgentThinkingPayload;
+      msg.thinking = (msg.thinking || '') + (payload.text || '');
+    } else if (event.type === 'tool.partial') {
+      // Group partial tool output by step, appending each chunk to its slot.
+      const payload = event.data as AgentToolPartialPayload;
+      msg.partials = msg.partials || {};
+      const slot = msg.partials[payload.step] || {
+        step: payload.step,
+        tool: payload.tool,
+        chunks: [],
+      };
+      slot.chunks = [...slot.chunks, payload.chunk];
+      msg.partials[payload.step] = slot;
+    }
+
+    // `plan.ready` and `job.succeeded` events may carry a result payload.
+    const result = event.data?.result;
+    if (event.type === 'plan.ready' && result) {
+      msg.planResult = result as AgentPlanResult;
+      msg.planHash = msg.planResult.planHash;
+    }
+    if (event.type === 'job.succeeded' && result) {
+      if (kind === 'plan') {
+        msg.planResult = result as AgentPlanResult;
+        msg.planHash = msg.planResult.planHash;
+      } else {
+        msg.executeResult = result as AgentExecutionResult;
+      }
+    }
+  };
+
+  // Autopilot runs plans that need no confirmation; confirm policy runs read-only plans.
+  const shouldAutoExecutePlan = ({ planResult: plan }: ChatMessage): boolean => {
+    if (!plan) return false;
+    if (s.policy.value === 'autopilot') return !plan.requiresConfirmation;
+    return s.policy.value === 'confirm' && Boolean(isReadOnlyAutoExecutable(plan));
+  };
+
+  /**
+   * Stream events for `jobId` into `msg`. Resolves true when the stream ended
+   * without throwing or was aborted locally, false when it failed otherwise.
+   */
+  async function streamJobEvents(
+    kind: 'plan' | 'execute',
+    msg: ChatMessage,
+    jobId: string,
+  ): Promise<boolean> {
+    const streamKey = `${msg.id}:${kind}`;
+    stopStream(streamKey); // abort any stream already registered under this key
+    const abort = new AbortController();
+    s.streamControllers.set(streamKey, abort);
+    const onEvent = (event: AgentJobEvent) => {
+      // Events are applied only while ensureTurnNotCanceled still approves the turn.
+      if (ensureTurnNotCanceled(msg)) applyAgentEvent(msg, event, kind);
+    };
+    try {
+      await streamAgentJobEvents(jobId, { onEvent }, abort.signal);
+      return true;
+    } catch {
+      return abort.signal.aborted;
+    } finally {
+      // Unregister only our own controller; the key may belong to a newer stream.
+      if (s.streamControllers.get(streamKey) === abort) {
+        s.streamControllers.delete(streamKey);
+      }
+    }
+  }
+
   async function pollPlanJob(msg: ChatMessage, jobId: string): Promise<void> {
     const timerKey = `${msg.id}:plan`;
     await startPollLoop(timerKey, msg, async (generation) => {
@@ -387,11 +564,7 @@ export default function useAgentSession() {
           msg.errorMessage = job.errorMessage || 'Plan failed.';
         }
         if (isTerminalStatus(job.status)) {
-          const shouldAutoExecute =
-            msg.planResult &&
-            ((s.policy.value === 'autopilot' && !msg.planResult.requiresConfirmation) ||
-              (s.policy.value === 'confirm' && isReadOnlyAutoExecutable(msg.planResult)));
-          if (shouldAutoExecute) {
+          if (shouldAutoExecutePlan(msg)) {
             await runExecute(msg);
           }
           return false;
@@ -439,6 +612,7 @@ export default function useAgentSession() {
       role: 'user',
       content: input,
       status: 'succeeded',
+      events: [],
       timestamp: now,
     };
     const agentMsg: ChatMessage = {
@@ -446,6 +620,7 @@ export default function useAgentSession() {
       role: 'agent',
       content: '',
       status: 'pending',
+      events: [],
       timestamp: now,
     };
     session.messages.push(userMsg, agentMsg);
@@ -463,14 +638,19 @@ export default function useAgentSession() {
       reactiveAgent.planJobId = res.jobId;
       if (isTurnCanceled(reactiveAgent) || reactiveAgent.status === 'canceled') {
         try {
-          await cancelAgentJob(res.jobId);
+          await cancelAgentTurn(res.jobId);
         } catch {
           // ignore cancellation sync errors after local cancel
         }
         return;
       }
       reactiveAgent.status = 'pending';
-      await pollPlanJob(reactiveAgent, res.jobId);
+      const streamed = await streamJobEvents('plan', reactiveAgent, res.jobId);
+      if (!streamed && ensureTurnNotCanceled(reactiveAgent)) {
+        await pollPlanJob(reactiveAgent, res.jobId);
+      } else if (streamed && ensureTurnNotCanceled(reactiveAgent) && shouldAutoExecutePlan(reactiveAgent)) {
+        await runExecute(reactiveAgent);
+      }
     } catch (error) {
       if (isTurnCanceled(reactiveAgent) || reactiveAgent.status === 'canceled') return;
       reactiveAgent.status = 'failed';
@@ -521,13 +701,16 @@ export default function useAgentSession() {
       msg.executeJobId = res.jobId;
       if (!ensureTurnNotCanceled(msg)) {
         try {
-          await cancelAgentJob(res.jobId);
+          await cancelAgentTurn(res.jobId);
         } catch {
           // ignore cancellation sync errors after local cancel
         }
         return;
       }
-      await pollExecuteJob(msg, res.jobId);
+      const streamed = await streamJobEvents('execute', msg, res.jobId);
+      if (!streamed && ensureTurnNotCanceled(msg)) {
+        await pollExecuteJob(msg, res.jobId);
+      }
     } catch (error) {
       if (!ensureTurnNotCanceled(msg)) return;
       msg.status = 'failed';
@@ -535,15 +718,89 @@ export default function useAgentSession() {
     }
   }
 
+  // Job id that replies and controls target: the execute job if set, else the plan job.
+  const activeJobId = (msg: ChatMessage): string | undefined => msg.executeJobId || msg.planJobId;
+
+  async function replyToAsk(msg: ChatMessage, value: unknown): Promise<void> {
+    const jobId = activeJobId(msg);
+    if (!jobId || !msg.pendingAsk) return; // no job or no open ask: nothing to answer
+    const pendingAsk = msg.pendingAsk; // kept so a failed send can restore it
+    msg.pendingAsk = undefined;
+    msg.status = 'running'; // optimistic: state flips before the request resolves
+    try {
+      await sendAgentReply(jobId, pendingAsk.messageId, value);
+    } catch (error) {
+      msg.status = 'waiting_for_user'; // roll back the optimistic update
+      msg.pendingAsk = pendingAsk;
+      msg.errorMessage = extractErrorMessage(error, 'Reply failed.');
+    }
+  }
+
+  async function pauseTurn(msg: ChatMessage): Promise<void> {
+    const jobId = activeJobId(msg);
+    if (!jobId) return; // no job id yet: nothing to pause
+    msg.pauseRequestedAt = new Date().toISOString(); // stamped before the request is sent
+    try {
+      await pauseAgentJob(jobId);
+    } catch (error) {
+      msg.pauseRequestedAt = undefined; // undo the stamp when the request fails
+      msg.errorMessage = extractErrorMessage(error, 'Pause failed.');
+    }
+  }
+
+  // Send a resume request for the turn's active job; a failure lands in msg.errorMessage.
+  async function resumeTurn(msg: ChatMessage): Promise<void> {
+    const target = activeJobId(msg);
+    try {
+      if (target) await resumeAgentJob(target);
+    } catch (cause) {
+      msg.errorMessage = extractErrorMessage(cause, 'Resume failed.');
+    }
+  }
+
+  // Send an approve request for the turn's active job; a failure lands in msg.errorMessage.
+  async function approveStep(msg: ChatMessage): Promise<void> {
+    const target = activeJobId(msg);
+    try {
+      if (target) await approveAgentStep(target);
+    } catch (cause) {
+      msg.errorMessage = extractErrorMessage(cause, 'Approve failed.');
+    }
+  }
+
+  // Send a deny request for the turn's active job; a failure lands in msg.errorMessage.
+  async function denyStep(msg: ChatMessage): Promise<void> {
+    const target = activeJobId(msg);
+    try {
+      if (target) await denyAgentStep(target);
+    } catch (cause) {
+      msg.errorMessage = extractErrorMessage(cause, 'Deny failed.');
+    }
+  }
+
+  // Send a skip request for the turn's active job; a failure lands in msg.errorMessage.
+  async function skipStep(msg: ChatMessage): Promise<void> {
+    const target = activeJobId(msg);
+    try {
+      if (target) await skipAgentStep(target);
+    } catch (cause) {
+      msg.errorMessage = extractErrorMessage(cause, 'Skip failed.');
+    }
+  }
+
   async function cancel(msg: ChatMessage): Promise<void> {
     markTurnCanceled(msg);
     msg.status = 'canceled';
-    const jobId = msg.executeJobId || msg.planJobId;
+    msg.pendingAsk = undefined;
+    msg.pauseRequestedAt = undefined;
     stopPolling(`${msg.id}:plan`);
     stopPolling(`${msg.id}:execute`);
+    stopStream(`${msg.id}:plan`);
+    stopStream(`${msg.id}:execute`);
+    const jobId = activeJobId(msg);
     if (!jobId) return;
     try {
-      await cancelAgentJob(jobId);
+      await cancelAgentTurn(jobId);
     } catch (error) {
       msg.errorMessage = extractErrorMessage(error, 'Cancel failed.');
     }
@@ -571,5 +828,11 @@ export default function useAgentSession() {
     sendMessage,
     runExecute,
     cancel,
+    replyToAsk,
+    pauseTurn,
+    resumeTurn,
+    approveStep,
+    denyStep,
+    skipStep,
   };
 }
diff --git a/web/src/composables/useAskTimeout.spec.ts b/web/src/composables/useAskTimeout.spec.ts
new file mode 100644
index 0000000..47407cc
--- /dev/null
+++ b/web/src/composables/useAskTimeout.spec.ts
@@ -0,0 +1,37 @@
+import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
+import { ref } from 'vue';
+import { useAskTimeout } from './useAskTimeout';
+
+describe('useAskTimeout', () => {
+  beforeEach(() => {
+    vi.useFakeTimers();
+  });
+
+  afterEach(() => {
+    vi.useRealTimers();
+  });
+
+  it('counts down from askedAt + timeoutSec', () => {
+    const askedAt = ref('2026-05-26T12:00:00.000Z');
+    const timeoutSec = ref(120);
+    vi.setSystemTime(new Date('2026-05-26T12:00:30.000Z'));
+    const { remainingSec, formatted, expired } = useAskTimeout(askedAt, timeoutSec);
+    expect(remainingSec.value).toBe(90); // 120 s window, 30 s already elapsed
+    expect(formatted.value).toBe('01:30');
+    expect(expired.value).toBe(false);
+    // Move the clock past the 12:02:00 deadline, then let the ticker fire.
+    vi.setSystemTime(new Date('2026-05-26T12:02:01.000Z'));
+    vi.advanceTimersByTime(1000);
+    expect(expired.value).toBe(true);
+    expect(remainingSec.value).toBe(0);
+    expect(formatted.value).toBe('00:00');
+  });
+
+  it('returns expired immediately when askedAt is missing', () => {
+    const askedAt = ref<string | undefined>(undefined);
+    const timeoutSec = ref(60);
+    const { expired, formatted } = useAskTimeout(askedAt, timeoutSec);
+    expect(expired.value).toBe(true);
+    expect(formatted.value).toBe('00:00');
+  });
+});
diff --git a/web/src/composables/useAskTimeout.ts b/web/src/composables/useAskTimeout.ts
new file mode 100644
index 0000000..8cab007
--- /dev/null
+++ b/web/src/composables/useAskTimeout.ts
@@ -0,0 +1,60 @@
+import { computed, getCurrentScope, onScopeDispose, ref, watchEffect, type Ref } from 'vue';
+
+/**
+ * Countdown that starts at `askedAt` and runs out `timeoutSec` seconds later.
+ * Returns `remainingSec` (never negative), `formatted` (`mm:ss`) and
+ * `expired` (true when there is no valid deadline or no time is left).
+ */
+export function useAskTimeout(
+  askedAt: Ref<string | undefined | null>,
+  timeoutSec: Ref<number>,
+) {
+  const now = ref<number>(Date.now());
+  let ticker: ReturnType<typeof setInterval> | null = null;
+
+  // Deadline in epoch milliseconds, or null when askedAt is empty or unparseable.
+  const resolveDeadline = (): number | null => {
+    if (!askedAt.value) return null;
+    const askedMs = Date.parse(askedAt.value);
+    return Number.isNaN(askedMs) ? null : askedMs + timeoutSec.value * 1000;
+  };
+
+  const stopTicker = () => {
+    if (ticker) {
+      clearInterval(ticker);
+      ticker = null;
+    }
+  };
+
+  // Restart the 1 s ticker whenever the inputs change; skip it without a usable deadline.
+  const stopWatch = watchEffect(() => {
+    stopTicker();
+    now.value = Date.now();
+    if (!askedAt.value || timeoutSec.value <= 0) return;
+    const deadlineMs = resolveDeadline();
+    if (deadlineMs === null) return;
+    ticker = setInterval(() => {
+      now.value = Date.now();
+      if (now.value >= deadlineMs) stopTicker(); // deadline reached: stop ticking
+    }, 1000);
+  });
+
+  if (getCurrentScope()) {
+    onScopeDispose(() => {
+      stopTicker();
+      stopWatch();
+    });
+  }
+
+  const deadline = computed(resolveDeadline);
+  const remainingSec = computed(() =>
+    deadline.value === null ? 0 : Math.max(0, Math.ceil((deadline.value - now.value) / 1000)),
+  );
+  const expired = computed(() => deadline.value === null || remainingSec.value <= 0);
+  const formatted = computed(() => {
+    const pad = (part: number) => String(part).padStart(2, '0');
+    return `${pad(Math.floor(remainingSec.value / 60))}:${pad(remainingSec.value % 60)}`;
+  });
+
+  return { remainingSec, formatted, expired };
+}
diff --git a/web/src/i18n/messages.ts b/web/src/i18n/messages.ts
index 8d27119..2388308 100644
--- a/web/src/i18n/messages.ts
+++ b/web/src/i18n/messages.ts
@@ -513,10 +513,25 @@ export type LocaleKey =
   | 'agent.v2.turn.status.succeeded'
   | 'agent.v2.turn.status.failed'
   | 'agent.v2.turn.status.canceled'
+  | 'agent.v2.turn.status.waiting_for_user'
+  | 'agent.v2.turn.status.paused'
+  | 'agent.v2.turn.controls.pause'
+  | 'agent.v2.turn.controls.resume'
+  | 'agent.v2.turn.controls.skip'
+  | 'agent.v2.turn.controls.approve'
+  | 'agent.v2.turn.controls.deny'
+  | 'agent.v2.turn.ask.placeholder'
+  | 'agent.v2.turn.ask.send'
+  | 'agent.v2.turn.ask.timeout'
+  | 'agent.v2.turn.progress.label'
+  | 'agent.v2.turn.thinking.label'
+  | 'agent.v2.turn.thinking.toggle'
   | 'agent.v2.turn.cost.label'
   | 'agent.v2.turn.cost.tokens'
   | 'agent.v2.turn.cost.calls'
   | 'agent.v2.turn.cost.est'
+  | 'agent.v2.turn.evidence.label'
+  | 'agent.v2.turn.evidence.more'
   | 'agent.v2.turn.warn.label'
   | 'agent.v2.turn.execute'
   | 'agent.v2.turn.cancel'
@@ -1093,10 +1108,25 @@ export const LOCALE_MESSAGES: Record<AppLanguage, LocaleMessages> = {
     'agent.v2.turn.status.succeeded': '已完成',
     'agent.v2.turn.status.failed': '失败',
     'agent.v2.turn.status.canceled': '已取消',
+    'agent.v2.turn.status.waiting_for_user': '等待你回复',
+    'agent.v2.turn.status.paused': '已暂停',
+    'agent.v2.turn.controls.pause': '暂停',
+    'agent.v2.turn.controls.resume': '继续',
+    'agent.v2.turn.controls.skip': '跳过此步',
+    'agent.v2.turn.controls.approve': '批准',
+    'agent.v2.turn.controls.deny': '拒绝',
+    'agent.v2.turn.ask.placeholder': '输入回答…',
+    'agent.v2.turn.ask.send': '发送',
+    'agent.v2.turn.ask.timeout': '剩余 {value}',
+    'agent.v2.turn.progress.label': '进度',
+    'agent.v2.turn.thinking.label': '思考过程',
+    'agent.v2.turn.thinking.toggle': '展开 / 收起',
     'agent.v2.turn.cost.label': '消耗',
     'agent.v2.turn.cost.tokens': 'tokens',
     'agent.v2.turn.cost.calls': '调用',
     'agent.v2.turn.cost.est': '预计',
+    'agent.v2.turn.evidence.label': '规划依据',
+    'agent.v2.turn.evidence.more': '更多',
     'agent.v2.turn.warn.label': '警告',
     'agent.v2.turn.execute': '执行',
     'agent.v2.turn.cancel': '取消',
@@ -1668,10 +1698,25 @@ export const LOCALE_MESSAGES: Record<AppLanguage, LocaleMessages> = {
     'agent.v2.turn.status.succeeded': 'succeeded',
     'agent.v2.turn.status.failed': 'failed',
     'agent.v2.turn.status.canceled': 'canceled',
+    'agent.v2.turn.status.waiting_for_user': 'WAITING FOR YOU',
+    'agent.v2.turn.status.paused': 'PAUSED',
+    'agent.v2.turn.controls.pause': 'Pause',
+    'agent.v2.turn.controls.resume': 'Resume',
+    'agent.v2.turn.controls.skip': 'Skip step',
+    'agent.v2.turn.controls.approve': 'Approve',
+    'agent.v2.turn.controls.deny': 'Deny',
+    'agent.v2.turn.ask.placeholder': 'Type your answer…',
+    'agent.v2.turn.ask.send': 'Send',
+    'agent.v2.turn.ask.timeout': '{value} left',
+    'agent.v2.turn.progress.label': 'PROGRESS',
+    'agent.v2.turn.thinking.label': 'THINKING',
+    'agent.v2.turn.thinking.toggle': 'Expand / Collapse',
     'agent.v2.turn.cost.label': 'COST',
     'agent.v2.turn.cost.tokens': 'tokens',
     'agent.v2.turn.cost.calls': 'calls',
     'agent.v2.turn.cost.est': 'est',
+    'agent.v2.turn.evidence.label': 'PLANNING EVIDENCE',
+    'agent.v2.turn.evidence.more': 'more',
     'agent.v2.turn.warn.label': 'WARN',
     'agent.v2.turn.execute': 'Execute',
     'agent.v2.turn.cancel': 'Cancel',
diff --git a/web/src/mock/handlers/agent.ts b/web/src/mock/handlers/agent.ts
index 09feeeb..e0cade1 100644
--- a/web/src/mock/handlers/agent.ts
+++ b/web/src/mock/handlers/agent.ts
@@ -3,6 +3,8 @@ import { createMockId, getCurrentUser, mockJobs } from '../state';
 import type {
   AgentBackgroundJob,
   AgentExecutionResult,
+  AgentInboxMessageRequest,
+  AgentInboxMessageResponse,
   AgentPlanResult,
   AgentProposedAction,
   ExecuteAgentRequest,
@@ -13,6 +15,52 @@ const nowIso = () => new Date().toISOString();
 
 const isTerminal = (status: string) => ['succeeded', 'failed', 'canceled'].includes(status);
 
+// Drops punctuation and counting / file-type filler words; returns the leftover keywords or undefined.
+const extractCountSearch = (input: string) => {
+  // Whole question phrases are blanked first, then the individual filler tokens.
+  const phrases = [
+    '我上传了多少部',
+    '我上传了多少个',
+    '我上传了几部',
+    '我上传了几个',
+    '上传了多少部',
+    '上传了多少个',
+    '上传了几部',
+    '上传了几个',
+    '有多少部',
+    '有多少个',
+    '有几部',
+    '有几个',
+  ];
+  const tokens = [
+    '我',
+    '上传',
+    '了',
+    '有',
+    '多少',
+    '几个',
+    '几部',
+    '多少部',
+    '多少个',
+    '部',
+    '个',
+    '文件',
+    '电影',
+    '影片',
+    '视频',
+    '音频',
+    '音乐',
+    '图片',
+    '照片',
+    '文档',
+    '压缩包',
+  ];
+  const blankOut = (text: string, needle: string) => text.split(needle).join(' ');
+  const depunctuated = input.replace(/[?？!！。.,，;；:：]/g, ' ').trim();
+  const stripped = [...phrases, ...tokens].reduce(blankOut, depunctuated);
+  return stripped.split(/\s+/).filter(Boolean).join(' ') || undefined;
+};
+
 const pickPlanActions = (input: string): AgentProposedAction[] => {
   const normalized = input.toLowerCase();
   if (
@@ -33,9 +81,10 @@ const pickPlanActions = (input: string): AgentProposedAction[] => {
           folderId: 'root',
           recursive: true,
           category:
-            normalized.includes('电影') || normalized.includes('视频') || normalized.includes('movie')
+            normalized.includes('电影') || normalized.includes('视频') || normalized.includes('几部') || normalized.includes('movie')
               ? 'video'
               : undefined,
+          search: extractCountSearch(input),
         },
       },
     ];
@@ -194,6 +243,21 @@ const finishJobCanceled = (job: AgentBackgroundJob) => {
   job.updatedAt = timestamp;
 };
 
+// Mock helper: mark an unfinished job as paused and set its phase to executing.
+const pauseJob = (job: AgentBackgroundJob) => {
+  if (isTerminal(job.status)) return;
+  job.status = 'paused';
+  job.agentPhase = 'executing';
+  job.updatedAt = nowIso();
+};
+
+// Mock helper: flip an unfinished job back to running and bump its update time.
+const resumeJob = (job: AgentBackgroundJob) => {
+  if (isTerminal(job.status)) return;
+  job.status = 'running';
+  job.updatedAt = nowIso();
+};
+
 const getJobById = (jobId: string) => (mockJobs[jobId] || null) as AgentBackgroundJob | null;
 
 const shouldSimulateFailure = (input: string) => {
@@ -224,6 +288,24 @@ const schedulePlanLifecycle = (job: AgentBackgroundJob, payload: PlanAgentReques
       toolCalls: proposedActions.length,
       durationSecEstimate: proposedActions.length * 4,
     },
+    planningEvidence: [
+      {
+        step: 1,
+        tool: 'drive.searchFiles',
+        input: {
+          folderId: payload.context.rootFolderId || 'root',
+          query: payload.input,
+          category: 'video',
+        },
+        outputPreview: {
+          totalItems: 2,
+          items: [
+            { fileId: '19', name: '银翼杀手1982.mp4' },
+            { fileId: '20', name: '银翼杀手2049.mp4' },
+          ],
+        },
+      },
+    ],
   };
 
   setTimeout(() => {
@@ -272,10 +354,13 @@ const scheduleExecuteLifecycle = (job: AgentBackgroundJob, plan: AgentPlanResult
 const mockExecutionAnswer = (plan: AgentPlanResult) => {
   const countAction = plan.proposedActions.find((action) => action.tool === 'drive.countFiles');
   if (!countAction) return null;
+  const search = String(countAction.input.search || '').trim();
+  const qualifier = search ? `名称包含“${search}”的` : '';
   if (countAction.input.category === 'video') {
-    return '你上传了 7 部电影（按视频文件统计）。';
+    const total = search === '银翼杀手' ? 2 : 7;
+    return `你上传了 ${total} 部${qualifier}电影（按视频文件统计）。`;
   }
-  return '你上传了 12 个文件。';
+  return `你上传了 12 个${qualifier}文件。`;
 };
 
 export const setupAgentMocks = () => {
@@ -369,8 +454,8 @@ export const setupAgentMocks = () => {
     };
   });
 
-  Mock.mock(/\/api\/v1\/agent\/cancel\/([^/?]+)$/, 'post', (options) => {
-    const jobId = (options.url.match(/\/api\/v1\/agent\/cancel\/([^/?]+)/) || [])[1];
+  Mock.mock(/\/api\/v1\/agent\/jobs\/([^/?]+)\/messages$/, 'post', (options) => {
+    const jobId = (options.url.match(/\/api\/v1\/agent\/jobs\/([^/?]+)\/messages/) || [])[1];
     const job = jobId ? getJobById(jobId) : null;
     if (!job) {
       return {
@@ -381,19 +466,28 @@ export const setupAgentMocks = () => {
       };
     }
 
-    if (!isTerminal(job.status)) {
+    const payload = JSON.parse(options.body || '{}') as AgentInboxMessageRequest;
+    // A finished job must keep its final status, so cancel is ignored for terminal jobs
+    // (pauseJob and resumeJob perform the same check themselves).
+    if (payload.kind === 'control.cancel' && !isTerminal(job.status)) {
       finishJobCanceled(job);
+    } else if (payload.kind === 'control.pause') {
+      pauseJob(job);
+    } else if (payload.kind === 'control.resume') {
+      resumeJob(job);
     }
 
+    const response: AgentInboxMessageResponse = {
+      inboxMessageId: createMockId('inbox'),
+      kind: payload.kind,
+      acceptedAt: nowIso(),
+    };
+
     return {
       success: true,
       code: 200,
-      message: 'Job canceled',
-      data: {
-        jobId: job.jobId,
-        status: job.status,
-        canceledAt: job.cancelRequestedAt || nowIso(),
-      },
+      message: 'Agent message accepted',
+      data: response,
     };
   });
 };
diff --git a/web/src/mock/handlers/skill.ts b/web/src/mock/handlers/skill.ts
index 2cd81a8..6368cbb 100644
--- a/web/src/mock/handlers/skill.ts
+++ b/web/src/mock/handlers/skill.ts
@@ -4,6 +4,22 @@ import { createMockId, getCurrentUser, mockSkills, paginate } from '../state';
 type VisibilityFilter = 'all' | 'global' | 'private';
 
 const now = () => new Date().toISOString();
+const supportedTools = new Set([
+  'drive.listFolder',
+  'drive.countFiles',
+  'drive.searchFiles',
+  'drive.getFileInfo',
+  'drive.listRecent',
+  'drive.statsByCategory',
+  'drive.findDuplicates',
+  'drive.createFolder',
+  'drive.moveFile',
+  'drive.moveFolder',
+  'drive.renameFile',
+  'drive.renameFolder',
+  'drive.deleteFile',
+  'drive.deleteFolder',
+]);
 
 const slugify = (input: string) => {
   return String(input || 'skill')
@@ -22,6 +38,12 @@ function isVisibleToUser(skill: any, userId: string, visibility: VisibilityFilte
   return skill.visibility === 'global' || (skill.visibility === 'private' && skill.ownerUserId === userId);
 }
 
+// Normalizes a raw whitelist to trimmed, non-empty tool names and lists those missing from supportedTools.
+function validateTools(raw: unknown) {
+  const tools = (Array.isArray(raw) ? raw : []).map((item) => String(item).trim()).filter(Boolean);
+  return { tools, unknownTools: tools.filter((tool) => !supportedTools.has(tool)) };
+}
+
 export const setupSkillMocks = () => {
   Mock.mock(/\/api\/v1\/agent\/skills(?:\?.*)?$/, 'get', (options) => {
     const url = new URL(options.url, 'http://localhost');
@@ -89,6 +111,15 @@ export const setupSkillMocks = () => {
         data: null,
       };
     }
+    const { tools, unknownTools } = validateTools(payload.toolWhitelist);
+    if (unknownTools.length) {
+      return {
+        success: false,
+        code: 422,
+        message: 'Unknown agent tool in toolWhitelist',
+        data: { unknownTools },
+      };
+    }
 
     let key = '';
     for (let i = 0; i < 8; i += 1) {
@@ -103,7 +134,7 @@ export const setupSkillMocks = () => {
       name,
       description,
       triggersText: payload.triggersText ?? null,
-      toolWhitelist: Array.isArray(payload.toolWhitelist) ? payload.toolWhitelist : [],
+      toolWhitelist: tools,
       planTemplate: payload.planTemplate || {},
       inputsSchema: payload.inputsSchema || {},
       outputsSchema: payload.outputsSchema || {},
@@ -142,7 +173,18 @@ export const setupSkillMocks = () => {
     if (payload.name !== undefined) skill.name = String(payload.name || '').trim() || skill.name;
     if (payload.description !== undefined) skill.description = String(payload.description || '').trim() || skill.description;
     if (payload.triggersText !== undefined) skill.triggersText = payload.triggersText;
-    if (payload.toolWhitelist !== undefined) skill.toolWhitelist = Array.isArray(payload.toolWhitelist) ? payload.toolWhitelist : [];
+    if (payload.toolWhitelist !== undefined) {
+      const { tools, unknownTools } = validateTools(payload.toolWhitelist);
+      if (unknownTools.length) {
+        return {
+          success: false,
+          code: 422,
+          message: 'Unknown agent tool in toolWhitelist',
+          data: { unknownTools },
+        };
+      }
+      skill.toolWhitelist = tools;
+    }
     if (payload.planTemplate !== undefined) skill.planTemplate = payload.planTemplate || {};
     if (payload.inputsSchema !== undefined) skill.inputsSchema = payload.inputsSchema || {};
     if (payload.outputsSchema !== undefined) skill.outputsSchema = payload.outputsSchema || {};
@@ -227,6 +269,15 @@ export const setupSkillMocks = () => {
 
     const results: Array<{ skillKey: string; action: 'created' | 'updated' }> = [];
     for (const item of items) {
+      const { tools, unknownTools } = validateTools(item.toolWhitelist);
+      if (unknownTools.length) {
+        return {
+          success: false,
+          code: 422,
+          message: 'Unknown agent tool in toolWhitelist',
+          data: { unknownTools },
+        };
+      }
       const skillKey = String(item.skillKey || '').trim();
       const name = String(item.name || '').trim();
       const description = String(item.description || '').trim();
@@ -239,7 +290,7 @@ export const setupSkillMocks = () => {
           name,
           description,
           triggersText: item.triggersText ?? null,
-          toolWhitelist: Array.isArray(item.toolWhitelist) ? item.toolWhitelist : [],
+          toolWhitelist: tools,
           planTemplate: item.planTemplate || {},
           inputsSchema: item.inputsSchema || {},
           outputsSchema: item.outputsSchema || {},
@@ -253,7 +304,7 @@ export const setupSkillMocks = () => {
         existing.name = name;
         existing.description = description;
         existing.triggersText = item.triggersText ?? null;
-        existing.toolWhitelist = Array.isArray(item.toolWhitelist) ? item.toolWhitelist : [];
+        existing.toolWhitelist = tools;
         existing.planTemplate = item.planTemplate || {};
         existing.inputsSchema = item.inputsSchema || {};
         existing.outputsSchema = item.outputsSchema || {};
diff --git a/web/src/mock/handlers/user.ts b/web/src/mock/handlers/user.ts
index fbd0d9d..7bbdf21 100644
--- a/web/src/mock/handlers/user.ts
+++ b/web/src/mock/handlers/user.ts
@@ -5,6 +5,7 @@ import {
   getCurrentUser,
   mockLogs,
   mockRegistrationEmailDomainRules,
+  mockUsageEvents,
   mockUsers,
   paginate,
 } from '../state';
@@ -43,6 +44,32 @@ function isAllowedEmailDomain(email: string) {
   });
 }
 
+// Reads usageFrom / usageTo (epoch ms); a missing or unparseable bound falls back to 7 days ago / now.
+function usageWindow(url: URL) {
+  const now = Date.now();
+  const weekAgo = now - 7 * 24 * 60 * 60 * 1000;
+  const bound = (name: string, fallback: number) => {
+    const raw = url.searchParams.get(name);
+    const parsed = raw ? Date.parse(raw) : fallback;
+    return Number.isFinite(parsed) ? parsed : fallback;
+  };
+  return { from: bound('usageFrom', weekAgo), to: bound('usageTo', now) };
+}
+
+// Sums traffic bytes and agent tokens of one user's mock usage events inside [from, to] (inclusive).
+function usageStatsForUser(userId: string, window: { from: number; to: number }) {
+  const stats = { trafficBytes: 0, agentTokens: 0 };
+  for (const event of mockUsageEvents) {
+    if (event.userId !== userId) continue;
+    const occurredAt = Date.parse(event.occurredAt);
+    if (!Number.isFinite(occurredAt)) continue;
+    if (occurredAt < window.from || occurredAt > window.to) continue;
+    stats.trafficBytes += event.trafficBytes;
+    stats.agentTokens += event.agentTokens;
+  }
+  return stats;
+}
+
 export const setupUserMocks = () => {
   Mock.mock(/\/api\/v1\/users(?:\?.*)?$/, 'get', (options) => {
     const url = new URL(options.url, 'http://localhost');
@@ -80,6 +107,7 @@ export const setupUserMocks = () => {
     const search = (url.searchParams.get('search') || '').toLowerCase();
     const statusFilter = url.searchParams.get('status');
     const roleFilter = url.searchParams.get('role');
+    const window = usageWindow(url);
 
     const filtered = mockUsers.filter((user) => {
       if (search) {
@@ -88,7 +116,7 @@ export const setupUserMocks = () => {
         if (!hit) return false;
       }
       if (statusFilter && user.status !== statusFilter) return false;
-      if (roleFilter && user.role !== roleFilter) return false;
+      if (roleFilter && user.role.toUpperCase() !== roleFilter.toUpperCase()) return false;
       return true;
     });
 
@@ -101,8 +129,10 @@ export const setupUserMocks = () => {
       emailVerified: user.emailVerified,
       emailVerifiedAt: user.emailVerifiedAt,
       createdAt: user.createdAt,
-      role: user.role,
+      role: user.role.toUpperCase(),
       status: user.status,
+      usagePercentage: Number(((user.storageUsed / user.storageLimit) * 100).toFixed(2)),
+      usageStats: usageStatsForUser(user.userId, window),
       lastActiveAt: new Date(Date.now() - Mock.Random.integer(1, 72) * 3600000).toISOString(),
       lastLoginAt: new Date(Date.now() - Mock.Random.integer(1, 240) * 3600000).toISOString(),
     }));
diff --git a/web/src/mock/state.ts b/web/src/mock/state.ts
index 8789787..6413739 100644
--- a/web/src/mock/state.ts
+++ b/web/src/mock/state.ts
@@ -15,6 +15,13 @@ export type MockUserRecord = User & {
   preference: UserPreference;
 };
 
+export interface MockUsageEvent {
+  userId: string;
+  occurredAt: string;
+  trafficBytes: number;
+  agentTokens: number;
+}
+
 const now = () => new Date().toISOString();
 
 const randomRecentTime = (maxHours = 72) => {
@@ -35,7 +42,22 @@ export const mockSkills: AgentSkillItem[] = [
     name: 'Organize By Type',
     description: 'Organize files into folders by mime/type.',
     triggersText: 'organize, classify, sort by type',
-    toolWhitelist: ['files.list', 'folders.create', 'files.move'],
+    toolWhitelist: [
+      'drive.listFolder',
+      'drive.countFiles',
+      'drive.searchFiles',
+      'drive.getFileInfo',
+      'drive.listRecent',
+      'drive.statsByCategory',
+      'drive.findDuplicates',
+      'drive.createFolder',
+      'drive.moveFile',
+      'drive.moveFolder',
+      'drive.renameFile',
+      'drive.renameFolder',
+      'drive.deleteFile',
+      'drive.deleteFolder',
+    ],
     planTemplate: {},
     inputsSchema: {},
     outputsSchema: {},
@@ -50,7 +72,7 @@ export const mockSkills: AgentSkillItem[] = [
     name: 'Cleanup Downloads',
     description: 'Find and cleanup old downloads.',
     triggersText: 'cleanup, downloads, remove old files',
-    toolWhitelist: ['files.list', 'files.delete'],
+    toolWhitelist: ['drive.searchFiles', 'drive.listRecent', 'drive.deleteFile'],
     planTemplate: {},
     inputsSchema: {},
     outputsSchema: {},
@@ -174,6 +196,25 @@ export const mockUsers: MockUserRecord[] = [
   },
 ];
 
+// Seed data: two usage events per mock user, (index + 1) and (index + 20) days before load time.
+export const mockUsageEvents: MockUsageEvent[] = mockUsers.flatMap((user, index) => {
+  const daysAgo = (days: number) => new Date(Date.now() - days * 24 * 60 * 60 * 1000).toISOString();
+  return [
+    {
+      userId: user.userId,
+      occurredAt: daysAgo(index + 1),
+      trafficBytes: (index + 1) * 256 * 1024 * 1024,
+      agentTokens: (index + 1) * 1250,
+    },
+    {
+      userId: user.userId,
+      occurredAt: daysAgo(index + 20),
+      trafficBytes: (index + 1) * 64 * 1024 * 1024,
+      agentTokens: (index + 1) * 300,
+    },
+  ];
+});
+
 export const mockShares: Array<Share & { ownerUserId: string }> = [
   {
     shareId: 'share_1001',
diff --git a/web/src/pages/__dev/Library.vue b/web/src/pages/__dev/Library.vue
index 4802ede..29a6091 100644
--- a/web/src/pages/__dev/Library.vue
+++ b/web/src/pages/__dev/Library.vue
@@ -217,9 +217,22 @@ const agPolicy = ref<'planOnly' | 'confirm' | 'autopilot'>('confirm');
 const agReasoningEffort = ref<'adaptive' | 'low' | 'medium' | 'high' | 'xhigh' | 'max'>('adaptive');
 
 const makeTurn = (status: 'pending' | 'running' | 'succeeded' | 'failed' | 'canceled', withPlan = true): AgentTurn => ({
-  user: { id: `u-${status}`, role: 'user', content: 'Sort by year then month', status: 'succeeded', timestamp: '2026-05-20T00:00:00Z' },
+  user: { id: `u-${status}`, role: 'user', content: 'Sort by year then month', status: 'succeeded', events: [], timestamp: '2026-05-20T00:00:00Z' },
   agent: {
     id: `a-${status}`, role: 'agent', content: '', status,
+    events: [
+      {
+        id: `e-${status}-1`,
+        jobId: `job-${status}`,
+        taskType: 'agent.execute',
+        type: 'job.running',
+        status: 'running',
+        agentPhase: 'executing',
+        message: '正在执行计划。',
+        data: {},
+        timestamp: '2026-05-20T00:00:00Z',
+      },
+    ],
     timestamp: '2026-05-20T00:00:00Z',
     planHash: withPlan && status !== 'pending' ? 'h-' + status : undefined,
     planResult: withPlan && status !== 'pending' ? {
diff --git a/web/src/pages/agent/workspace/AgentWorkspace.vue b/web/src/pages/agent/workspace/AgentWorkspace.vue
index a713cb7..864b523 100644
--- a/web/src/pages/agent/workspace/AgentWorkspace.vue
+++ b/web/src/pages/agent/workspace/AgentWorkspace.vue
@@ -14,7 +14,8 @@ import { ui } from '../../../utils/ui';
 const {
   sessions, activeSessionId, activeTurns, policy, reasoningEffort, taskInput, isSending,
   createSession, switchSession, deleteSession,
-  sendMessage, runExecute, cancel,
+  sendMessage, runExecute, cancel, replyToAsk,
+  pauseTurn, resumeTurn, skipStep, approveStep, denyStep,
 } = useAgentSession();
 
 const localeStore = useLocaleStore();
@@ -31,8 +32,21 @@ const turnOf = (id: string): ChatMessage | null =>
 
 const onExecute = (id: string) => { const m = turnOf(id); if (m) runExecute(m); };
 const onCancel  = (id: string) => { const m = turnOf(id); if (m) cancel(m); };
+const onReply = (id: string, value: unknown) => { const m = turnOf(id); if (m) replyToAsk(m, value); };
+const onPause = (id: string) => { const m = turnOf(id); if (m) pauseTurn(m); };
+const onResume = (id: string) => { const m = turnOf(id); if (m) resumeTurn(m); };
+const onSkip = (id: string) => { const m = turnOf(id); if (m) skipStep(m); };
+const onApprove = (id: string) => { const m = turnOf(id); if (m) approveStep(m); };
+const onDeny = (id: string) => { const m = turnOf(id); if (m) denyStep(m); };
 const onHint = (text: string) => { taskInput.value = text; sendMessage(); };
 
+// The composer is locked while a message is sending or any turn is paused / waiting for the user.
+const isInputLocked = computed(() => {
+  if (isSending.value) return true;
+  const blocking = ['waiting_for_user', 'paused'];
+  return activeTurns.value.some((turn) => blocking.includes(turn.agent.status));
+});
+
 const onDeleteSession = async (id: string) => {
   const target = sessions.value.find((s) => s.id === id);
   const ok = await ui.confirm({
@@ -63,6 +77,12 @@ const onDeleteSession = async (id: string) => {
         :focused-id="focusedTurnId"
         @execute="onExecute"
         @cancel="onCancel"
+        @reply="onReply"
+        @pause="onPause"
+        @resume="onResume"
+        @skip="onSkip"
+        @approve="onApprove"
+        @deny="onDeny"
         @focus-turn="focusedTurnId = $event"
         @hint-pick="onHint"
       />
@@ -70,7 +90,7 @@ const onDeleteSession = async (id: string) => {
         v-model="taskInput"
         :policy="policy"
         :reasoning-effort="reasoningEffort"
-        :disabled="isSending"
+        :disabled="isInputLocked"
         @update:policy="policy = $event"
         @update:reasoning-effort="reasoningEffort = $event"
         @submit="sendMessage"
diff --git a/web/src/pages/console/users/UsersPage.spec.ts b/web/src/pages/console/users/UsersPage.spec.ts
new file mode 100644
index 0000000..c91475b
--- /dev/null
+++ b/web/src/pages/console/users/UsersPage.spec.ts
@@ -0,0 +1,101 @@
+import { flushPromises, mount } from '@vue/test-utils';
+import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
+
+vi.mock('../../../api/user', () => ({
+  getAdminUsers: vi.fn(),
+  updateUserStatus: vi.fn(),
+}));
+
+vi.mock('../../../utils/ui', () => ({
+  ui: {
+    toast: vi.fn(),
+  },
+}));
+
+import { getAdminUsers } from '../../../api/user';
+import UsersPage from './UsersPage.vue';
+
+const getAdminUsersMock = vi.mocked(getAdminUsers);
+
+function pageData() {
+  return {
+    items: [
+      {
+        userId: '1',
+        username: 'alice',
+        email: 'alice@example.com',
+        role: 'USER' as const,
+        status: 'active' as const,
+        emailVerified: true,
+        emailVerifiedAt: null,
+        storageLimit: 1024,
+        storageUsed: 0,
+        usagePercentage: 0,
+        lastLoginAt: null,
+        lastActiveAt: null,
+        createdAt: '2026-05-01T00:00:00Z',
+        usageStats: {
+          trafficBytes: 1536,
+          agentTokens: 12345,
+        },
+      },
+    ],
+    pagination: {
+      totalItems: 1,
+      totalPages: 1,
+      perPage: 20,
+      currentPage: 1,
+      hasPrev: false,
+      hasNext: false,
+    },
+  };
+}
+
+describe('UsersPage', () => {
+  beforeEach(() => {
+    vi.useFakeTimers();
+    vi.setSystemTime(new Date('2026-05-26T12:00:00.000Z'));
+    getAdminUsersMock.mockResolvedValue(pageData());
+  });
+
+  afterEach(() => {
+    vi.useRealTimers();
+    vi.clearAllMocks();
+  });
+
+  it('loads the default previous 7 day usage window', async () => {
+    mount(UsersPage);
+    await flushPromises();
+
+    expect(getAdminUsersMock).toHaveBeenCalledWith(expect.objectContaining({
+      page: 1,
+      perPage: 20,
+      usageFrom: '2026-05-19T00:00:00.000Z',
+      usageTo: '2026-05-26T23:59:59.999Z',
+    }));
+  });
+
+  it('reloads with the edited usage window after apply', async () => {
+    const wrapper = mount(UsersPage);
+    await flushPromises();
+
+    const dateInputs = wrapper.findAll('input[type="date"]');
+    await dateInputs[0].setValue('2026-05-01');
+    await dateInputs[1].setValue('2026-05-10');
+    await wrapper.find('.filter-bar__apply').trigger('click');
+    await flushPromises();
+
+    expect(getAdminUsersMock).toHaveBeenLastCalledWith(expect.objectContaining({
+      usageFrom: '2026-05-01T00:00:00.000Z',
+      usageTo: '2026-05-10T23:59:59.999Z',
+    }));
+  });
+
+  it('renders upload traffic and agent tokens', async () => {
+    const wrapper = mount(UsersPage);
+    await flushPromises();
+
+    expect(wrapper.text()).toContain('Uploaded 1.5 KB');
+    expect(wrapper.text()).toContain('Agent 12,345 tokens');
+  });
+});
diff --git a/web/src/pages/console/users/UsersPage.vue b/web/src/pages/console/users/UsersPage.vue
index db14822..1a27a93 100644
--- a/web/src/pages/console/users/UsersPage.vue
+++ b/web/src/pages/console/users/UsersPage.vue
@@ -2,23 +2,46 @@
 import { onMounted, ref } from 'vue';
 import { getAdminUsers, updateUserStatus } from '../../../api/user';
 import { AdminTable, FilterBar, StatusBadge } from '../../../components/console';
+import type { AdminUserItem } from '../../../types/user';
 import { ui } from '../../../utils/ui';
 
-interface AdminUser {
-  userId: string;
-  username: string;
-  email: string;
-  role: string;
-  status: 'active' | 'suspended';
-  lastLoginAt: string | null;
-  createdAt: string;
+const DAY_MS = 24 * 60 * 60 * 1000;
+
+function toDateInput(date: Date) {
+  return date.toISOString().slice(0, 10);
+}
+
+function startOfUtcDay(value: string) {
+  return `${value}T00:00:00.000Z`;
+}
+
+function endOfUtcDay(value: string) {
+  return `${value}T23:59:59.999Z`;
+}
+
+// Human-readable size in 1024-based steps (B..TB); negative or non-finite input renders as "0 B".
+function formatBytes(bytes: number) {
+  const units = ['B', 'KB', 'MB', 'GB', 'TB'];
+  let value = Number.isFinite(bytes) ? Math.max(0, bytes) : 0;
+  let unitIndex = 0;
+  for (; value >= 1024 && unitIndex < units.length - 1; unitIndex += 1) {
+    value /= 1024;
+  }
+  return `${value.toFixed(unitIndex === 0 ? 0 : 1)} ${units[unitIndex]}`;
+}
+
+function formatNumber(value: number) {
+  return new Intl.NumberFormat('en-US').format(value);
 }
 
-const items = ref<AdminUser[]>([]);
+const today = new Date();
+const items = ref<AdminUserItem[]>([]);
 const totalPages = ref(1);
 const currentPage = ref(1);
 const search = ref('');
 const status = ref<'all' | 'active' | 'suspended'>('all');
+const usageFrom = ref(toDateInput(new Date(today.getTime() - 7 * DAY_MS)));
+const usageTo = ref(toDateInput(today));
 const loading = ref(false);
 
 async function load(page = 1) {
@@ -29,8 +52,12 @@ async function load(page = 1) {
       perPage: 20,
       ...(search.value ? { search: search.value.trim() } : {}),
       ...(status.value !== 'all' ? { status: status.value } : {}),
+      ...(usageFrom.value && usageTo.value ? {
+        usageFrom: startOfUtcDay(usageFrom.value),
+        usageTo: endOfUtcDay(usageTo.value),
+      } : {}),
     });
-    items.value = resp.items as AdminUser[];
+    items.value = resp.items;
     totalPages.value = resp.pagination.totalPages;
     currentPage.value = resp.pagination.currentPage;
   } finally {
@@ -38,7 +65,8 @@ async function load(page = 1) {
   }
 }
 
-async function toggleStatus(user: AdminUser) {
+async function toggleStatus(user: AdminUserItem) {
+  if (user.status !== 'active' && user.status !== 'suspended') return;
   const next = user.status === 'active' ? 'suspended' : 'active';
   await updateUserStatus(user.userId, next);
   user.status = next;
@@ -59,6 +87,14 @@ onMounted(() => load(1));
         <option value="active">Active</option>
         <option value="suspended">Suspended</option>
       </select>
+      <label class="filter-field">
+        <span>Usage from</span>
+        <input v-model="usageFrom" type="date" />
+      </label>
+      <label class="filter-field">
+        <span>Usage to</span>
+        <input v-model="usageTo" type="date" />
+      </label>
     </FilterBar>
 
     <AdminTable
@@ -71,16 +107,20 @@ onMounted(() => load(1));
       <template #row="{ row }">
         <div class="row">
           <div class="row__main">
-            <strong>{{ (row as AdminUser).username }}</strong>
-            <small>{{ (row as AdminUser).email }} · {{ (row as AdminUser).role }}</small>
+            <strong>{{ (row as AdminUserItem).username }}</strong>
+            <small>{{ (row as AdminUserItem).email }} · {{ (row as AdminUserItem).role }}</small>
+            <div class="row__usage">
+              <span>Uploaded {{ formatBytes((row as AdminUserItem).usageStats.trafficBytes) }}</span>
+              <span>Agent {{ formatNumber((row as AdminUserItem).usageStats.agentTokens) }} tokens</span>
+            </div>
           </div>
           <div class="row__actions">
             <StatusBadge
-              :value="(row as AdminUser).status"
-              :tone="(row as AdminUser).status === 'active' ? 'positive' : 'danger'"
+              :value="(row as AdminUserItem).status"
+              :tone="(row as AdminUserItem).status === 'active' ? 'positive' : 'danger'"
             />
-            <button class="row__btn" @click="toggleStatus(row as AdminUser)">
-              {{ (row as AdminUser).status === 'active' ? 'Suspend' : 'Activate' }}
+            <button class="row__btn" @click="toggleStatus(row as AdminUserItem)">
+              {{ (row as AdminUserItem).status === 'active' ? 'Suspend' : 'Activate' }}
             </button>
           </div>
         </div>
@@ -103,6 +143,14 @@ onMounted(() => load(1));
   font-weight: var(--weight-medium);
   letter-spacing: var(--tracking-snug);
 }
+.filter-field {
+  display: flex;
+  gap: var(--sp-xs);
+  align-items: center;
+  color: var(--text-tertiary);
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+}
 .row {
   display: flex;
   justify-content: space-between;
@@ -123,6 +171,15 @@ onMounted(() => load(1));
   font-family: var(--font-mono);
   font-size: var(--text-small);
 }
+.row__usage {
+  display: flex;
+  flex-wrap: wrap;
+  gap: var(--sp-sm);
+  margin-top: 6px;
+  color: var(--text-secondary);
+  font-family: var(--font-mono);
+  font-size: var(--text-small);
+}
 .row__actions { display: flex; gap: var(--sp-sm); align-items: center; }
 .row__btn {
   height: 28px;
diff --git a/web/src/types/agent.d.ts b/web/src/types/agent.d.ts
index f143e2b..d515943 100644
--- a/web/src/types/agent.d.ts
+++ b/web/src/types/agent.d.ts
@@ -12,6 +12,22 @@ export type AgentJobPhase =
   | 'completed'
   | 'failed'
   | 'canceled';
+export type AgentJobEventType = // string literals accepted by AgentJobEvent.type
+  | 'job.queued'
+  | 'job.running'
+  | 'plan.ready'
+  | 'tool.started'
+  | 'tool.succeeded'
+  | 'tool.failed'
+  | 'tool.partial' // presumably pairs with AgentToolPartialPayload - TODO confirm
+  | 'agent.thinking' // presumably pairs with AgentThinkingPayload - TODO confirm
+  | 'agent.progress' // presumably pairs with AgentProgressPayload - TODO confirm
+  | 'agent.ask' // presumably pairs with AgentAskPayload - TODO confirm
+  | 'agent.paused'
+  | 'agent.resumed'
+  | 'job.succeeded'
+  | 'job.failed'
+  | 'job.canceled';
 
 export interface AgentDataPolicy {
   allowFileContent: boolean;
@@ -68,6 +84,13 @@ export interface AgentChosenSkill {
   name: string;
 }
 
+export interface AgentPlanningEvidence { // element type of the optional AgentPlanResult.planningEvidence array
+  step: number; // presumably the planning step index - base (0 or 1) not shown, TODO confirm
+  tool: string; // presumably the name of the tool that was called - TODO confirm
+  input: Record<string, any>; // NOTE(review): other new types in this file use Record<string, unknown>; consider aligning
+  outputPreview: Record<string, any>; // NOTE(review): same `any` vs `unknown` question as `input`
+}
+
 export interface AgentPlanResult {
   planJobId: string;
   planHash: string;
@@ -76,6 +99,7 @@ export interface AgentPlanResult {
   summary: string;
   requiresConfirmation: boolean;
   costEstimate: AgentCostEstimate;
+  planningEvidence?: AgentPlanningEvidence[] | null;
 }
 
 export interface ExecuteAgentRequest {
@@ -95,12 +119,6 @@ export interface ExecuteAgentResponse {
   taskType: 'agent.execute';
 }
 
-export interface CancelAgentResponse {
-  jobId: string;
-  status: string;
-  canceledAt: string;
-}
-
 export interface AgentExecutionResult {
   planJobId: string;
   executeJobId: string;
@@ -112,7 +130,69 @@ export interface AgentExecutionResult {
   finishedAt: string;
 }
 
+export interface AgentJobEvent { // a single event record tied to a job via jobId
+  id: string;
+  jobId: string;
+  taskType: string; // presumably values such as 'agent.execute' (cf. ExecuteAgentResponse.taskType) - TODO confirm
+  type: AgentJobEventType;
+  status: string;
+  agentPhase?: AgentJobPhase | string | null; // NOTE(review): `| string` absorbs the AgentJobPhase literals, so this is effectively `string | null`
+  message: string;
+  data: Record<string, any>; // NOTE(review): untyped; presumably one of the Agent*Payload shapes depending on `type` - TODO confirm
+  timestamp: string; // presumably an ISO-8601 string - TODO confirm
+}
+
 export type AgentBackgroundJob<T = Record<string, any>> = BackgroundJob<T> & {
   agentPhase?: AgentJobPhase | null;
   cancelRequestedAt?: string | null;
 };
+
+// ----------------- Inbox (upstream channel) -----------------
+
+export type AgentInboxMessageKind = // string literals accepted by AgentInboxMessageRequest.kind and echoed in AgentInboxMessageResponse.kind
+  | 'reply' // presumably the answer to an 'agent.ask' event (see AgentInboxMessageRequest.replyTo) - TODO confirm
+  | 'control.pause'
+  | 'control.resume'
+  | 'control.approve'
+  | 'control.deny'
+  | 'control.skip'
+  | 'control.cancel';
+
+export interface AgentInboxMessageRequest { // only `kind` is required; the endpoint that consumes this is not visible here
+  kind: AgentInboxMessageKind;
+  replyTo?: string; // presumably the AgentAskPayload.messageId being answered - TODO confirm
+  value?: unknown; // shape not specified here; consumers must narrow before use
+  metadata?: Record<string, unknown>;
+}
+
+export interface AgentInboxMessageResponse { // presumably the acknowledgement returned for an AgentInboxMessageRequest - TODO confirm
+  inboxMessageId: string;
+  kind: AgentInboxMessageKind;
+  acceptedAt: string; // presumably an ISO-8601 timestamp - TODO confirm
+}
+
+// ----------------- New event payloads -----------------
+
+export interface AgentAskPayload { // presumably AgentJobEvent.data for 'agent.ask' events - TODO confirm
+  messageId: string;
+  prompt: string;
+  schema: Record<string, unknown>; // presumably describes the expected reply value (JSON Schema?) - TODO confirm
+  timeoutSec: number; // presumably seconds, going by the `Sec` suffix - TODO confirm
+}
+
+export interface AgentProgressPayload { // presumably AgentJobEvent.data for 'agent.progress' events - TODO confirm
+  step: number;
+  total: number;
+  message?: string;
+  percent?: number; // NOTE(review): range not specified (0-1 vs 0-100) - confirm with the producer
+}
+
+export interface AgentThinkingPayload { // presumably AgentJobEvent.data for 'agent.thinking' events - TODO confirm
+  text: string;
+}
+
+export interface AgentToolPartialPayload { // presumably AgentJobEvent.data for 'tool.partial' events - TODO confirm
+  step: number;
+  tool: string;
+  chunk: unknown; // shape not specified here; consumers must narrow before use
+}
diff --git a/web/src/types/user.d.ts b/web/src/types/user.d.ts
index 971023a..fc2e7a2 100644
--- a/web/src/types/user.d.ts
+++ b/web/src/types/user.d.ts
@@ -23,6 +23,38 @@ export interface User {
   avatar?: string | null;
 }
 
+export interface AdminUserUsageStats { // type of AdminUserItem.usageStats
+  trafficBytes: number; // shown under an "Uploaded" label via formatBytes in the admin user row template
+  agentTokens: number; // shown as "Agent ... tokens" via formatNumber in the admin user row template
+}
+
+export interface AdminUserItem { // row type the admin user list template casts each `row` to
+  userId: string;
+  username: string;
+  email: string;
+  role: 'USER' | 'ADMIN';
+  status: UserStatus | 'pending_verification'; // NOTE(review): wider than GetAdminUsersParams.status, which is UserStatus only
+  emailVerified: boolean;
+  emailVerifiedAt?: string | null;
+  storageLimit: number;
+  storageUsed: number;
+  usagePercentage: number; // presumably derived from storageUsed / storageLimit; scale (0-1 vs 0-100) not shown - TODO confirm
+  lastLoginAt?: string | null;
+  lastActiveAt?: string | null;
+  createdAt: string;
+  usageStats: AdminUserUsageStats;
+}
+
+export interface GetAdminUsersParams { // every field is optional
+  page?: number;
+  perPage?: number;
+  search?: string;
+  status?: UserStatus; // NOTE(review): cannot express 'pending_verification', which AdminUserItem.status allows - intentional?
+  role?: 'USER' | 'ADMIN';
+  usageFrom?: string; // presumably the lower bound of the usage window; format not shown - TODO confirm
+  usageTo?: string; // presumably the upper bound of the usage window; format not shown - TODO confirm
+}
+
 export interface LoginResponse {
   token: string;
   tokenType: string;