```

feat(engine): 添加技能查看工具并优化异步任务管理 - 添加SkillViewTool到引擎加载器中，增强技能管理功能 - 在AgentLoop中引入_active_direct_task来跟踪活跃任务 - 实现直接任务执行时的同步处理逻辑 - 更新工具实例化方式以支持依赖注入 feat(config): 增加智能体运行时参数配置支持 - 扩展AgentDefaultsConfig添加max_tokens和temperature字段 - 实现配置解析函数_first_config_value处理多个配置源 - 支持通过Web API动态更新智能体运行时参数 - 添加前端页面配置表单和验证逻辑 refactor(provider): 统一最大令牌数参数类型为可选整型 - 将所有LLM提供者的max_tokens参数改为int | None类型 - 为AnthropicProvider实现模型特定的最大令牌数默认值 - 调整参数传递逻辑，优先级：调用参数 > 配置文件 > 模型默认值 - 移除硬编码的默认值，改用条件判断 feat(process): 增强事件投影功能 - 添加工具调用开始/结束事件的映射逻辑 - 实现技能激活事件的识别和展示 - 添加辅助函数处理工具调用名称和参数提取 - 优化运行记录关联逻辑，提升事件匹配准确性 fix(web): 更新网络请求客户端信任环境设置 - 将WebFetchTool和WebSearchTool的trust_env参数设为True - 确保HTTP客户端能够正确使用系统代理配置 - 修复可能的网络连接问题 test: 添加配置加载和事件投影相关测试 - 新增智能体默认参数配置测试用例 - 实现API配置持久化和重载测试 - 添加技能卡片和工具事件的投影测试 ```
2026-05-27 13:37:06 +08:00
parent 55b39563a0
commit 33a9845566
75 changed files with 2599 additions and 114 deletions
--- a/app-instance/backend/agents/registry.json
+++ b/app-instance/backend/agents/registry.json
@ -0,0 +1,145 @@
+{
+  "agents": [
+    {
+      "agent_id": "researcher",
+      "capabilities": [
+        "research",
+        "analysis",
+        "source review",
+        "requirements"
+      ],
+      "created_at": "2026-05-27T05:25:11.756341+00:00",
+      "description": "Finds facts, references, constraints, and implementation options.",
+      "display_name": "Researcher",
+      "metadata": {},
+      "model": null,
+      "name": "researcher",
+      "priority": 50,
+      "provider_name": null,
+      "role": "research",
+      "skill_names": [],
+      "source": "builtin",
+      "status": "active",
+      "system_prompt": "You are a research specialist. Gather concise evidence and tradeoffs for the parent task.",
+      "tags": [
+        "planning",
+        "research"
+      ],
+      "tool_hints": [],
+      "updated_at": "2026-05-27T05:25:11.756349+00:00"
+    },
+    {
+      "agent_id": "implementer",
+      "capabilities": [
+        "implementation",
+        "coding",
+        "refactor",
+        "integration"
+      ],
+      "created_at": "2026-05-27T05:25:11.756351+00:00",
+      "description": "Builds scoped implementation slices and proposes concrete changes.",
+      "display_name": "Implementer",
+      "metadata": {},
+      "model": null,
+      "name": "implementer",
+      "priority": 45,
+      "provider_name": null,
+      "role": "implementation",
+      "skill_names": [],
+      "source": "builtin",
+      "status": "active",
+      "system_prompt": "You are an implementation specialist. Produce practical, scoped implementation output.",
+      "tags": [
+        "coding",
+        "build"
+      ],
+      "tool_hints": [],
+      "updated_at": "2026-05-27T05:25:11.756353+00:00"
+    },
+    {
+      "agent_id": "reviewer",
+      "capabilities": [
+        "review",
+        "quality",
+        "risk",
+        "verification"
+      ],
+      "created_at": "2026-05-27T05:25:11.756355+00:00",
+      "description": "Reviews plans, code, outputs, and risks before final synthesis.",
+      "display_name": "Reviewer",
+      "metadata": {},
+      "model": null,
+      "name": "reviewer",
+      "priority": 45,
+      "provider_name": null,
+      "role": "review",
+      "skill_names": [],
+      "source": "builtin",
+      "status": "active",
+      "system_prompt": "You are a review specialist. Focus on defects, missing requirements, and risks.",
+      "tags": [
+        "review",
+        "quality"
+      ],
+      "tool_hints": [],
+      "updated_at": "2026-05-27T05:25:11.756356+00:00"
+    },
+    {
+      "agent_id": "tester",
+      "capabilities": [
+        "testing",
+        "verification",
+        "regression",
+        "qa"
+      ],
+      "created_at": "2026-05-27T05:25:11.756358+00:00",
+      "description": "Designs and executes verification checks for task outputs.",
+      "display_name": "Tester",
+      "metadata": {},
+      "model": null,
+      "name": "tester",
+      "priority": 40,
+      "provider_name": null,
+      "role": "testing",
+      "skill_names": [],
+      "source": "builtin",
+      "status": "active",
+      "system_prompt": "You are a testing specialist. Identify focused checks and report pass/fail evidence.",
+      "tags": [
+        "test",
+        "quality"
+      ],
+      "tool_hints": [],
+      "updated_at": "2026-05-27T05:25:11.756358+00:00"
+    },
+    {
+      "agent_id": "documenter",
+      "capabilities": [
+        "documentation",
+        "explanation",
+        "migration notes",
+        "release notes"
+      ],
+      "created_at": "2026-05-27T05:25:11.756360+00:00",
+      "description": "Writes and reconciles user-facing and internal documentation updates.",
+      "display_name": "Documenter",
+      "metadata": {},
+      "model": null,
+      "name": "documenter",
+      "priority": 35,
+      "provider_name": null,
+      "role": "documentation",
+      "skill_names": [],
+      "source": "builtin",
+      "status": "active",
+      "system_prompt": "You are a documentation specialist. Produce concise docs aligned with the implementation.",
+      "tags": [
+        "docs",
+        "communication"
+      ],
+      "tool_hints": [],
+      "updated_at": "2026-05-27T05:25:11.756360+00:00"
+    }
+  ],
+  "version": 1
+}
--- a/app-instance/backend/beaver/engine/loader.py
+++ b/app-instance/backend/beaver/engine/loader.py
@ -44,6 +44,7 @@ from beaver.tools.builtins import (
    SpawnTool,
    SessionSearchTool,
    SkillManageTool,
+    SkillViewTool,
    SkillsListTool,
    TerminalTool,
    TodoTool,
@ -220,16 +221,17 @@ class EngineLoader:
                    ObjectBackedTool(WriteFileTool()),
                    ObjectBackedTool(PatchFileTool()),
                    ObjectBackedTool(WebFetchTool()),
-            ObjectBackedTool(WebSearchTool()),
-            ObjectBackedTool(TerminalTool()),
-            ObjectBackedTool(ProcessTool()),
-            ObjectBackedTool(ExecuteCodeTool()),
-            ObjectBackedTool(TodoTool()),
-            ObjectBackedTool(ClarifyTool()),
-            ObjectBackedTool(SendMessageTool()),
-            ObjectBackedTool(DelegateTool()),
-            ObjectBackedTool(SpawnTool()),
-            SkillsListTool(),
+                    ObjectBackedTool(WebSearchTool()),
+                    ObjectBackedTool(TerminalTool()),
+                    ObjectBackedTool(ProcessTool()),
+                    ObjectBackedTool(ExecuteCodeTool()),
+                    ObjectBackedTool(TodoTool()),
+                    ObjectBackedTool(ClarifyTool()),
+                    ObjectBackedTool(SendMessageTool()),
+                    ObjectBackedTool(DelegateTool()),
+                    ObjectBackedTool(SpawnTool()),
+                    SkillsListTool(),
+                    ObjectBackedTool(SkillViewTool(loader=skills_loader)),
                    SkillManageTool(),
                    CronTool(),
                ]
--- a/app-instance/backend/beaver/engine/loop.py
+++ b/app-instance/backend/beaver/engine/loop.py
@ -48,7 +48,7 @@ class AgentProfile:
    name: str = "default"
    system_prompt: str = ""
    default_model: str = "gpt-4.1-mini"
-    max_tokens: int = 4096
+    max_tokens: int | None = None
    max_context_messages: int = 1000
    temperature: float = 0.2
    max_tool_iterations: int = 30
@ -89,6 +89,7 @@ class AgentLoop:
        self.loaded: EngineLoadResult | None = None
        self.runtime_services: dict[str, Any] = {}
        self._run_queue: asyncio.Queue[_DirectRunRequest | None] | None = None
+        self._active_direct_task: asyncio.Task[Any] | None = None
        self._running = False
        self._stop_requested = False

@ -130,6 +131,8 @@ class AgentLoop:
                if item.future.cancelled():
                    continue

+                previous_direct_task = self._active_direct_task
+                self._active_direct_task = asyncio.current_task()
                try:
                    result = await self._process_direct_impl(item.task, **item.kwargs)
                except asyncio.CancelledError:
@ -142,6 +145,8 @@ class AgentLoop:
                else:
                    if not item.future.done():
                        item.future.set_result(result)
+                finally:
+                    self._active_direct_task = previous_direct_task
        finally:
            if self._run_queue is not None:
                while True:
@ -183,6 +188,9 @@ class AgentLoop:
        if self._stop_requested:
            raise RuntimeError("AgentLoop.submit_direct() is not accepting new tasks after stop()")

+        if asyncio.current_task() is self._active_direct_task:
+            return await self._process_direct_impl(task, **kwargs)
+
        future: asyncio.Future[AgentRunResult] = asyncio.get_running_loop().create_future()
        await self._run_queue.put(_DirectRunRequest(task=task, kwargs=dict(kwargs), future=future))
        return await future
@ -363,7 +371,7 @@ class AgentLoop:
        resolved_request_timeout_seconds = configured_provider.get("request_timeout_seconds")
        resolved_embedding_model = embedding_model or config.default_embedding_model
        resolved_embedding_target = embedding_target or config.resolve_embedding_target()
-        resolved_max_tokens = max_tokens or self.profile.max_tokens
+        resolved_max_tokens = self.profile.max_tokens if max_tokens is None else max_tokens
        resolved_temperature = self.profile.temperature if temperature is None else temperature
        resolved_max_tool_iterations = (
            self.profile.max_tool_iterations if max_tool_iterations is None else max_tool_iterations
@ -892,7 +900,7 @@ class AgentLoop:
        provider: Any,
        messages: list[dict[str, Any]],
        model: str,
-        max_tokens: int,
+        max_tokens: int | None,
        temperature: float,
        thinking_enabled: bool | None,
    ) -> str:
--- a/app-instance/backend/beaver/engine/providers/anthropic.py
+++ b/app-instance/backend/beaver/engine/providers/anthropic.py
@ -43,7 +43,7 @@ class AnthropicProvider(LLMProvider):
        messages: list[dict[str, Any]],
        tools: list[dict[str, Any]] | None = None,
        model: str | None = None,
-        max_tokens: int = 4096,
+        max_tokens: int | None = None,
        temperature: float = 0.7,
        thinking_enabled: bool | None = None,
    ) -> LLMResponse:
@ -57,9 +57,14 @@ class AnthropicProvider(LLMProvider):
            "model": model or self.default_model,
            "system": system_prompt or "",
            "messages": anthropic_messages,
-            "max_tokens": max(1, max_tokens),
            "temperature": temperature,
        }
+        resolved_max_tokens = (
+            _default_max_tokens_for_model(model or self.default_model)
+            if max_tokens is None
+            else max(1, max_tokens)
+        )
+        kwargs["max_tokens"] = resolved_max_tokens
        if tools:
            kwargs["tools"] = _convert_tools(tools)

@ -100,6 +105,17 @@ class AnthropicProvider(LLMProvider):
        return self.default_model


+def _default_max_tokens_for_model(model: str) -> int:
+    """Return a conservative native output ceiling for Anthropic Messages."""
+
+    normalized = model.lower().replace("_", "-")
+    if "sonnet-4" in normalized or "opus-4" in normalized or "3-7" in normalized or "3.7" in normalized:
+        return 64_000
+    if "haiku" in normalized:
+        return 4_096
+    return 8_192
+
+
 def _convert_messages(messages: list[dict[str, Any]]) -> tuple[str, list[dict[str, Any]]]:
    system_prompt = ""
    converted: list[dict[str, Any]] = []
--- a/app-instance/backend/beaver/engine/providers/base.py
+++ b/app-instance/backend/beaver/engine/providers/base.py
@ -88,7 +88,7 @@ class LLMProvider(ABC):
        messages: list[dict[str, Any]],
        tools: list[dict[str, Any]] | None = None,
        model: str | None = None,
-        max_tokens: int = 4096,
+        max_tokens: int | None = None,
        temperature: float = 0.7,
        thinking_enabled: bool | None = None,
    ) -> LLMResponse:
--- a/app-instance/backend/beaver/engine/providers/chain.py
+++ b/app-instance/backend/beaver/engine/providers/chain.py
@ -56,7 +56,7 @@ class FallbackProviderChain(LLMProvider):
        messages: list[dict],
        tools: list[dict] | None = None,
        model: str | None = None,
-        max_tokens: int = 4096,
+        max_tokens: int | None = None,
        temperature: float = 0.7,
        thinking_enabled: bool | None = None,
    ) -> LLMResponse:
@ -115,7 +115,7 @@ class FallbackProviderChain(LLMProvider):
        messages: list[dict],
        tools: list[dict] | None,
        model: str,
-        max_tokens: int,
+        max_tokens: int | None,
        temperature: float,
        thinking_enabled: bool | None,
    ) -> LLMResponse:
--- a/app-instance/backend/beaver/engine/providers/codex.py
+++ b/app-instance/backend/beaver/engine/providers/codex.py
@ -39,7 +39,7 @@ class OpenAICodexProvider(LLMProvider):
        messages: list[dict[str, Any]],
        tools: list[dict[str, Any]] | None = None,
        model: str | None = None,
-        max_tokens: int = 4096,
+        max_tokens: int | None = None,
        temperature: float = 0.7,
        thinking_enabled: bool | None = None,
    ) -> LLMResponse:
--- a/app-instance/backend/beaver/engine/providers/custom.py
+++ b/app-instance/backend/beaver/engine/providers/custom.py
@ -47,7 +47,7 @@ class CustomProvider(LLMProvider):
        messages: list[dict[str, Any]],
        tools: list[dict[str, Any]] | None = None,
        model: str | None = None,
-        max_tokens: int = 4096,
+        max_tokens: int | None = None,
        temperature: float = 0.7,
        thinking_enabled: bool | None = None,
    ) -> LLMResponse:
@ -55,9 +55,10 @@ class CustomProvider(LLMProvider):
        kwargs: dict[str, Any] = {
            "model": model or self.default_model,
            "messages": self.sanitize_empty_content(messages),
-            "max_tokens": max(1, max_tokens),
            "temperature": temperature,
        }
+        if max_tokens is not None:
+            kwargs["max_tokens"] = max(1, max_tokens)
        if tools:
            kwargs.update(tools=tools, tool_choice="auto")
        try:
--- a/app-instance/backend/beaver/engine/providers/litellm.py
+++ b/app-instance/backend/beaver/engine/providers/litellm.py
@ -197,7 +197,7 @@ class LiteLLMProvider(LLMProvider):
        messages: list[dict[str, Any]],
        tools: list[dict[str, Any]] | None = None,
        model: str | None = None,
-        max_tokens: int = 4096,
+        max_tokens: int | None = None,
        temperature: float = 0.7,
        thinking_enabled: bool | None = None,
    ) -> LLMResponse:
@ -210,10 +210,11 @@ class LiteLLMProvider(LLMProvider):
        kwargs: dict[str, Any] = {
            "model": resolved_model,
            "messages": sanitized_messages,
-            "max_tokens": max(1, max_tokens),
            "temperature": temperature,
            "timeout": self.request_timeout_seconds or 45.0,
        }
+        if max_tokens is not None:
+            kwargs["max_tokens"] = max(1, max_tokens)
        if self.api_key:
            kwargs["api_key"] = self.api_key
        if self.api_base:
--- a/app-instance/backend/beaver/foundation/config/loader.py
+++ b/app-instance/backend/beaver/foundation/config/loader.py
@ -86,18 +86,25 @@ def _parse_agent_defaults(data: dict[str, Any]) -> AgentDefaultsConfig:
        model=_string(defaults.get("model") or data.get("model")),
        provider=_string(defaults.get("provider") or data.get("provider")),
        embedding_model=_string(defaults.get("embeddingModel") or defaults.get("embedding_model") or data.get("embeddingModel")),
+        max_tokens=_int(_first_config_value(
+            defaults.get("maxTokens"),
+            defaults.get("max_tokens"),
+            data.get("maxTokens"),
+            data.get("max_tokens"),
+        )),
+        temperature=_float(_first_config_value(defaults.get("temperature"), data.get("temperature"))),
        max_context_messages=_int(
            defaults.get("maxContextMessages")
            or defaults.get("max_context_messages")
            or data.get("maxContextMessages")
            or data.get("max_context_messages")
        ),
-        max_tool_iterations=_int(
-            defaults.get("maxToolIterations")
-            or defaults.get("max_tool_iterations")
-            or data.get("maxToolIterations")
-            or data.get("max_tool_iterations")
-        ),
+        max_tool_iterations=_int(_first_config_value(
+            defaults.get("maxToolIterations"),
+            defaults.get("max_tool_iterations"),
+            data.get("maxToolIterations"),
+            data.get("max_tool_iterations"),
+        )),
    )


@ -204,6 +211,13 @@ def _as_dict(value: Any) -> dict[str, Any]:
    return value if isinstance(value, dict) else {}


+def _first_config_value(*values: Any) -> Any:
+    for value in values:
+        if value not in (None, ""):
+            return value
+    return None
+
+
 def _string(value: Any) -> str | None:
    if value is None:
        return None
--- a/app-instance/backend/beaver/foundation/config/schema.py
+++ b/app-instance/backend/beaver/foundation/config/schema.py
@ -25,6 +25,8 @@ class AgentDefaultsConfig:
    model: str | None = None
    provider: str | None = None
    embedding_model: str | None = None
+    max_tokens: int | None = None
+    temperature: float | None = None
    max_context_messages: int | None = None
    max_tool_iterations: int | None = None

--- a/app-instance/backend/beaver/interfaces/web/app.py
+++ b/app-instance/backend/beaver/interfaces/web/app.py
@ -51,6 +51,8 @@ from .schemas import (
    WebChatRequest,
    WebChatResponse,
    WebErrorResponse,
+    WebAgentConfigRequest,
+    WebAgentConfigResponse,
    WebProviderConfigRequest,
    WebProviderConfigResponse,
    WebStatusResponse,
@ -595,6 +597,38 @@ def create_app(
        _reload_agent_config(agent_service, config_path)
        return WebProviderConfigResponse(ok=True, provider=spec.name, enabled=payload.enabled)

+    @app.post("/api/agent-config", response_model=WebAgentConfigResponse)
+    async def update_agent_config(
+        request: Request,
+        payload: WebAgentConfigRequest,
+    ) -> WebAgentConfigResponse:
+        if payload.max_tokens is not None and payload.max_tokens <= 0:
+            raise HTTPException(status_code=400, detail="max_tokens must be a positive integer or null")
+        if payload.temperature < 0 or payload.temperature > 2:
+            raise HTTPException(status_code=400, detail="temperature must be between 0 and 2")
+        if payload.max_tool_iterations < 0:
+            raise HTTPException(status_code=400, detail="max_tool_iterations must be zero or greater")
+
+        agent_service = get_agent_service(request)
+        config_path = agent_service.loader.config.config_path or default_config_path(workspace=agent_service.loader.workspace)
+        raw = _read_config_json(config_path)
+        agents = _ensure_dict(raw, "agents")
+        defaults = _ensure_dict(agents, "defaults")
+
+        if payload.max_tokens is None:
+            defaults.pop("maxTokens", None)
+            defaults.pop("max_tokens", None)
+        else:
+            defaults["maxTokens"] = payload.max_tokens
+            defaults.pop("max_tokens", None)
+        defaults["temperature"] = payload.temperature
+        defaults["maxToolIterations"] = payload.max_tool_iterations
+        defaults.pop("max_tool_iterations", None)
+
+        _write_config_json(config_path, raw)
+        _reload_agent_config(agent_service, config_path)
+        return WebAgentConfigResponse(ok=True)
+
    @app.get("/api/sessions")
    async def list_sessions(request: Request) -> list[dict[str, Any]]:
        loaded = get_agent_service(request).create_loop().boot()
--- a/app-instance/backend/beaver/interfaces/web/schemas/init.py
+++ b/app-instance/backend/beaver/interfaces/web/schemas/init.py
@ -8,6 +8,8 @@ from .chat import (
    WebChatRequest,
    WebChatResponse,
    WebErrorResponse,
+    WebAgentConfigRequest,
+    WebAgentConfigResponse,
    WebProviderConfigRequest,
    WebProviderConfigResponse,
    WebProviderTarget,
@ -22,6 +24,8 @@ __all__ = [
    "WebChatRequest",
    "WebChatResponse",
    "WebErrorResponse",
+    "WebAgentConfigRequest",
+    "WebAgentConfigResponse",
    "WebProviderConfigRequest",
    "WebProviderConfigResponse",
    "WebProviderTarget",
--- a/app-instance/backend/beaver/interfaces/web/schemas/chat.py
+++ b/app-instance/backend/beaver/interfaces/web/schemas/chat.py
@ -139,6 +139,20 @@ class WebProviderConfigResponse(BaseModel):
    enabled: bool


+class WebAgentConfigRequest(BaseModel):
+    """Agent runtime defaults update from the settings page."""
+
+    max_tokens: int | None = None
+    temperature: float
+    max_tool_iterations: int
+
+
+class WebAgentConfigResponse(BaseModel):
+    """Agent runtime defaults update result."""
+
+    ok: bool
+
+
 class WebStatusResponse(BaseModel):
    """Web 宿主层状态响应。"""

--- a/app-instance/backend/beaver/services/agent_service.py
+++ b/app-instance/backend/beaver/services/agent_service.py
@ -68,6 +68,14 @@ class AgentService:

    def _apply_configured_profile_defaults(self) -> None:
        defaults = self.loader.config.agents_defaults
+        self.profile.max_tokens = None
+        self.profile.temperature = 0.2
+        self.profile.max_context_messages = 1000
+        self.profile.max_tool_iterations = 30
+        if defaults.max_tokens is not None:
+            self.profile.max_tokens = max(1, defaults.max_tokens)
+        if defaults.temperature is not None:
+            self.profile.temperature = defaults.temperature
        if defaults.max_context_messages is not None:
            self.profile.max_context_messages = max(1, defaults.max_context_messages)
        if defaults.max_tool_iterations is not None:
--- a/app-instance/backend/beaver/services/process_service.py
+++ b/app-instance/backend/beaver/services/process_service.py
@ -50,10 +50,11 @@ class SessionProcessProjector:

        for record in records:
            payload = dict(record.event_payload or {})
-            task_id = payload.get("task_id")
+            run_record_for_event = run_records.get(str(record.run_id)) if record.run_id else None
+            task_id = payload.get("task_id") or getattr(run_record_for_event, "task_id", None)
            if not task_id:
                continue
-            attempt_index = int(payload.get("attempt_index") or 1)
+            attempt_index = int(payload.get("attempt_index") or getattr(run_record_for_event, "attempt_index", None) or 1)
            root_run_id = f"task:{task_id}:attempt:{attempt_index}"
            created_at = _timestamp(record.timestamp)
            root = runs.setdefault(
@ -73,7 +74,61 @@ class SessionProcessProjector:
                },
            )

-            if record.event_type == "task_execution_planned":
+            if record.event_type == "assistant_message_added" and record.tool_calls:
+                run_id = record.run_id or root_run_id
+                parent_run_id = root_run_id if run_id != root_run_id else None
+                for index, tool_call in enumerate(record.tool_calls):
+                    if not isinstance(tool_call, dict):
+                        continue
+                    tool_name = _tool_call_name(tool_call)
+                    add_event(
+                        event_id=f"{_event_id(record, 'tool-call')}:{index}",
+                        run_id=run_id,
+                        parent_run_id=parent_run_id,
+                        kind="tool_call_started",
+                        actor_type="tool",
+                        actor_id=tool_name,
+                        actor_name=tool_name,
+                        text=f"Calling tool: {tool_name}.",
+                        created_at=created_at,
+                        status="running",
+                        metadata={
+                            "task_id": task_id,
+                            "attempt_index": attempt_index,
+                            "timeline_type": "tool_call",
+                            "tool_name": tool_name,
+                            "tool_call_id": tool_call.get("id"),
+                            "arguments": _tool_call_arguments(tool_call),
+                        },
+                    )
+
+            elif record.event_type == "tool_result_recorded":
+                run_id = record.run_id or root_run_id
+                parent_run_id = root_run_id if run_id != root_run_id else None
+                tool_name = str(record.tool_name or payload.get("tool_name") or "tool")
+                add_event(
+                    event_id=_event_id(record, "tool-result"),
+                    run_id=run_id,
+                    parent_run_id=parent_run_id,
+                    kind="tool_call_finished",
+                    actor_type="tool",
+                    actor_id=tool_name,
+                    actor_name=tool_name,
+                    text=_truncate(str(record.content or payload.get("error") or "")),
+                    created_at=created_at,
+                    status="done" if payload.get("success", True) else "error",
+                    metadata={
+                        **dict(payload),
+                        "task_id": task_id,
+                        "attempt_index": attempt_index,
+                        "timeline_type": "tool_result",
+                        "tool_name": tool_name,
+                        "tool_call_id": record.tool_call_id,
+                        "result_summary": _truncate(str(record.content or payload.get("error") or "")),
+                    },
+                )
+
+            elif record.event_type == "task_execution_planned":
                plan_mode = payload.get("plan_mode") or "single"
                strategy = payload.get("strategy") or "single"
                node_ids = payload.get("node_ids") or []
@ -241,6 +296,7 @@ class SessionProcessProjector:
                main_run_id = str(payload.get("main_run_id") or "")
                if main_run_id:
                    run_record = run_records.get(main_run_id)
+                    activated_skill_names = _activated_skill_names(run_record)
                    runs[main_run_id] = {
                        "run_id": main_run_id,
                        "parent_run_id": root_run_id,
@ -254,8 +310,32 @@ class SessionProcessProjector:
                        "started_at": run_record.started_at if run_record is not None else created_at,
                        "finished_at": run_record.ended_at if run_record is not None else created_at,
                        "summary": _truncate(run_record.task_text if run_record is not None else ""),
-                        "metadata": {"task_id": task_id, "attempt_index": attempt_index},
+                        "metadata": {
+                            "task_id": task_id,
+                            "attempt_index": attempt_index,
+                            "skill_names": activated_skill_names,
+                        },
                    }
+                    if activated_skill_names:
+                        add_event(
+                            event_id=_event_id(record, "synthesis-skills"),
+                            run_id=main_run_id,
+                            parent_run_id=root_run_id,
+                            kind="skill_selected",
+                            actor_type="system",
+                            actor_id="skill-selector",
+                            actor_name="Skill Selector",
+                            text=f"Selected skill guidance: {', '.join(activated_skill_names)}.",
+                            created_at=created_at,
+                            status="done",
+                            metadata={
+                                "task_id": task_id,
+                                "attempt_index": attempt_index,
+                                "timeline_type": "skill",
+                                "skill_names": activated_skill_names,
+                                "activation_reasons": _activated_skill_reasons(run_record),
+                            },
+                        )
                    add_event(
                        event_id=_event_id(record, "synthesis"),
                        run_id=main_run_id,
@ -335,3 +415,49 @@ def _truncate(text: str, limit: int = 800) -> str:
    if len(cleaned) <= limit:
        return cleaned
    return cleaned[: limit - 1] + "..."
+
+
+def _activated_skill_names(run_record: Any | None) -> list[str]:
+    if run_record is None:
+        return []
+    names = []
+    for receipt in getattr(run_record, "activated_skills", []) or []:
+        skill_name = str(getattr(receipt, "skill_name", "") or "").strip()
+        if skill_name:
+            names.append(skill_name)
+    return list(dict.fromkeys(names))
+
+
+def _activated_skill_reasons(run_record: Any | None) -> list[str]:
+    if run_record is None:
+        return []
+    reasons = []
+    for receipt in getattr(run_record, "activated_skills", []) or []:
+        reason = str(getattr(receipt, "activation_reason", "") or "").strip()
+        if reason:
+            reasons.append(reason)
+    return reasons
+
+
+def _tool_call_name(tool_call: dict[str, Any]) -> str:
+    function_payload = tool_call.get("function")
+    if isinstance(function_payload, dict):
+        name = function_payload.get("name")
+        if name:
+            return str(name)
+    for key in ("name", "tool_name"):
+        value = tool_call.get(key)
+        if value:
+            return str(value)
+    return "tool"
+
+
+def _tool_call_arguments(tool_call: dict[str, Any]) -> Any:
+    function_payload = tool_call.get("function")
+    if isinstance(function_payload, dict) and "arguments" in function_payload:
+        return function_payload.get("arguments")
+    if "arguments" in tool_call:
+        return tool_call.get("arguments")
+    if "args" in tool_call:
+        return tool_call.get("args")
+    return None
--- a/app-instance/backend/beaver/tools/builtins/web.py
+++ b/app-instance/backend/beaver/tools/builtins/web.py
@ -51,7 +51,7 @@ class WebFetchTool:
        try:
            safe_url = _safe_url(url)
            limit = max(1000, min(int(max_chars or 12000), 50000))
-            async with httpx.AsyncClient(timeout=20, follow_redirects=True, trust_env=False) as client:
+            async with httpx.AsyncClient(timeout=20, follow_redirects=True, trust_env=True) as client:
                response = await client.get(
                    safe_url,
                    headers={"User-Agent": "Mozilla/5.0 Beaver/1.0"},
@ -96,7 +96,7 @@ class WebSearchTool:
                raise ValueError("query is required")
            bounded = max(1, min(int(limit or 5), 10))
            url = f"https://duckduckgo.com/html/?q={quote_plus(query)}"
-            async with httpx.AsyncClient(timeout=20, follow_redirects=True, trust_env=False) as client:
+            async with httpx.AsyncClient(timeout=20, follow_redirects=True, trust_env=True) as client:
                response = await client.get(url, headers={"User-Agent": "Mozilla/5.0 Beaver/1.0"})
            response.raise_for_status()
            html = response.text
--- a/app-instance/backend/tests/unit/test_agent_loop.py
+++ b/app-instance/backend/tests/unit/test_agent_loop.py
@ -0,0 +1,47 @@
+import asyncio
+from contextlib import suppress
+from typing import Any
+
+from beaver.engine import AgentLoop, AgentRunResult, EngineLoader
+
+
+def _run_result(run_id: str, output_text: str) -> AgentRunResult:
+    return AgentRunResult(
+        session_id="web:test",
+        run_id=run_id,
+        output_text=output_text,
+        finish_reason="stop",
+        tool_iterations=0,
+    )
+
+
+def test_running_loop_handles_reentrant_submit_direct(tmp_path) -> None:
+    async def run_case() -> None:
+        loop = AgentLoop(loader=EngineLoader(workspace=tmp_path))
+        calls: list[str] = []
+
+        async def fake_process_direct(task: str, **kwargs: Any) -> AgentRunResult:
+            calls.append(task)
+            if task == "outer":
+                return await loop.submit_direct("inner", session_id="web:test")
+            return _run_result(task, "inner completed")
+
+        loop._process_direct_impl = fake_process_direct  # type: ignore[method-assign]
+
+        loop_task = asyncio.create_task(loop.run())
+        await asyncio.sleep(0)
+        try:
+            result = await asyncio.wait_for(loop.submit_direct("outer", session_id="web:test"), timeout=1)
+        finally:
+            await loop.stop()
+            with suppress(asyncio.TimeoutError):
+                await asyncio.wait_for(loop_task, timeout=1)
+            if not loop_task.done():
+                loop_task.cancel()
+                with suppress(asyncio.CancelledError):
+                    await loop_task
+
+        assert result.output_text == "inner completed"
+        assert calls == ["outer", "inner"]
+
+    asyncio.run(run_case())
--- a/app-instance/backend/tests/unit/test_config_loader.py
+++ b/app-instance/backend/tests/unit/test_config_loader.py
@ -1,10 +1,12 @@
 import json

+from fastapi.testclient import TestClient
+
 from beaver.engine import AgentLoop, EngineLoader
 from beaver.engine.providers import make_provider_bundle
 from beaver.engine.providers.litellm import LiteLLMProvider
 from beaver.foundation.config import load_config
-from beaver.interfaces.web.app import _reload_agent_config
+from beaver.interfaces.web.app import create_app, _reload_agent_config
 from beaver.services.agent_service import AgentService


@ -161,6 +163,88 @@ def test_reload_agent_config_updates_booted_loop_config(tmp_path) -> None:
    service.close()


+def test_agent_defaults_include_runtime_controls(tmp_path) -> None:
+    config_path = tmp_path / "config.json"
+    config_path.write_text(
+        json.dumps(
+            {
+                "agents": {
+                    "defaults": {
+                        "maxTokens": 12345,
+                        "temperature": 0.4,
+                        "maxToolIterations": 9,
+                    }
+                }
+            }
+        ),
+        encoding="utf-8",
+    )
+
+    config = load_config(config_path=config_path)
+    service = AgentService(config_path=config_path)
+
+    assert config.agents_defaults.max_tokens == 12345
+    assert config.agents_defaults.temperature == 0.4
+    assert config.agents_defaults.max_tool_iterations == 9
+    assert service.profile.max_tokens == 12345
+    assert service.profile.temperature == 0.4
+    assert service.profile.max_tool_iterations == 9
+    service.close()
+
+
+def test_agent_config_api_persists_and_reloads_defaults(tmp_path) -> None:
+    config_path = tmp_path / "config.json"
+    config_path.write_text(json.dumps({"agents": {"defaults": {}}}), encoding="utf-8")
+    service = AgentService(config_path=config_path)
+    app = create_app(service=service, manage_service_lifecycle=False)
+
+    with TestClient(app) as client:
+        response = client.post(
+            "/api/agent-config",
+            json={"max_tokens": 8192, "temperature": 0.6, "max_tool_iterations": 12},
+        )
+        status = client.get("/api/status")
+
+    saved = json.loads(config_path.read_text(encoding="utf-8"))
+    defaults = saved["agents"]["defaults"]
+
+    assert response.status_code == 200
+    assert response.json() == {"ok": True}
+    assert defaults["maxTokens"] == 8192
+    assert defaults["temperature"] == 0.6
+    assert defaults["maxToolIterations"] == 12
+    assert service.profile.max_tokens == 8192
+    assert service.profile.temperature == 0.6
+    assert service.profile.max_tool_iterations == 12
+    assert status.json()["max_tokens"] == 8192
+    assert status.json()["temperature"] == 0.6
+    assert status.json()["max_tool_iterations"] == 12
+    service.close()
+
+
+def test_agent_config_api_accepts_zero_temperature_and_iterations(tmp_path) -> None:
+    config_path = tmp_path / "config.json"
+    service = AgentService(config_path=config_path)
+    app = create_app(service=service, manage_service_lifecycle=False)
+
+    with TestClient(app) as client:
+        response = client.post(
+            "/api/agent-config",
+            json={"max_tokens": None, "temperature": 0, "max_tool_iterations": 0},
+        )
+
+    config = load_config(config_path=config_path)
+
+    assert response.status_code == 200
+    assert config.agents_defaults.max_tokens is None
+    assert config.agents_defaults.temperature == 0
+    assert config.agents_defaults.max_tool_iterations == 0
+    assert service.profile.max_tokens is None
+    assert service.profile.temperature == 0
+    assert service.profile.max_tool_iterations == 0
+    service.close()
+
+
 def test_openai_compatible_qwen_config_keeps_openai_provider() -> None:
    bundle = make_provider_bundle(
        model="qwen-plus",
--- a/app-instance/backend/tests/unit/test_initial_skill_tool_hints.py
+++ b/app-instance/backend/tests/unit/test_initial_skill_tool_hints.py
@ -0,0 +1,58 @@
+from __future__ import annotations
+
+import json
+from pathlib import Path
+
+from beaver.engine import EngineLoader
+from beaver.skills.catalog.utils import parse_frontmatter
+
+
+REPO_ROOT = Path(__file__).resolve().parents[4]
+
+EXPECTED_INITIAL_SKILL_TOOLS = {
+    "cron-scheduler": ["cron"],
+    "filesystem-operation": ["read_file", "write_file", "patch_file", "search_files", "list_directory"],
+    "memory-management": ["memory"],
+    "outlook-mail": [
+        "mcp_outlook_mcp_mail_list_folders",
+        "mcp_outlook_mcp_mail_list_messages",
+        "mcp_outlook_mcp_mail_search_messages",
+        "mcp_outlook_mcp_mail_get_message",
+        "mcp_outlook_mcp_mail_send_email",
+        "mcp_outlook_mcp_mail_reply_to_message",
+        "mcp_outlook_mcp_mail_forward_message",
+        "mcp_outlook_mcp_mail_move_message",
+        "mcp_outlook_mcp_mail_delta_sync",
+        "mcp_outlook_mcp_calendar_list_events",
+        "mcp_outlook_mcp_calendar_create_event",
+        "mcp_outlook_mcp_calendar_update_event",
+        "mcp_outlook_mcp_calendar_get_schedule",
+        "mcp_outlook_mcp_calendar_find_meeting_times",
+        "mcp_outlook_mcp_calendar_delta_sync",
+    ],
+    "skills-admin": ["skills_list", "skill_manage", "skill_view"],
+    "terminal-operation": ["terminal", "process", "execute_code"],
+    "utility-tools": ["clarify", "delegate", "send_message", "spawn", "todo"],
+    "web-operation": ["web_fetch", "web_search"],
+}
+
+
+def test_initial_skill_tool_hints_match_runtime_tool_names() -> None:
+    for skill_name, expected_tools in EXPECTED_INITIAL_SKILL_TOOLS.items():
+        skill_dir = REPO_ROOT / "skills" / skill_name / "versions" / "v0001"
+        frontmatter, _body = parse_frontmatter((skill_dir / "SKILL.md").read_text(encoding="utf-8"))
+        version = json.loads((skill_dir / "version.json").read_text(encoding="utf-8"))
+
+        assert frontmatter["tools"] == expected_tools
+        assert version["frontmatter"]["tools"] == expected_tools
+        assert version["tool_hints"] == expected_tools
+
+
+def test_default_runtime_registers_skill_view_tool(tmp_path: Path) -> None:
+    loaded = EngineLoader(workspace=tmp_path).load()
+    try:
+        assert "skill_view" in loaded.tools
+        assert loaded.tool_registry is not None
+        assert loaded.tool_registry.get("skill_view") is not None
+    finally:
+        loaded.close()
--- a/app-instance/backend/tests/unit/test_max_tokens_defaults.py
+++ b/app-instance/backend/tests/unit/test_max_tokens_defaults.py
@ -0,0 +1,64 @@
+import asyncio
+from types import SimpleNamespace
+
+from beaver.engine.loop import AgentProfile
+from beaver.engine.providers.anthropic import AnthropicProvider
+from beaver.engine.providers.litellm import LiteLLMProvider
+
+
+def test_agent_profile_uses_provider_output_default() -> None:
+    assert AgentProfile().max_tokens is None
+
+
+def test_litellm_omits_max_tokens_when_unset(monkeypatch) -> None:
+    captured_kwargs: dict = {}
+
+    async def fake_acompletion(**kwargs):
+        captured_kwargs.update(kwargs)
+        return SimpleNamespace(
+            choices=[
+                SimpleNamespace(
+                    message=SimpleNamespace(content="ok", tool_calls=[]),
+                    finish_reason="stop",
+                )
+            ],
+            usage=None,
+        )
+
+    monkeypatch.setattr("beaver.engine.providers.litellm.acompletion", fake_acompletion)
+
+    async def run_case():
+        provider = LiteLLMProvider(default_model="openai/gpt-test")
+        return await provider.chat(messages=[{"role": "user", "content": "hi"}], max_tokens=None)
+
+    response = asyncio.run(run_case())
+
+    assert response.content == "ok"
+    assert "max_tokens" not in captured_kwargs
+
+
+def test_anthropic_uses_model_output_ceiling_when_unset(monkeypatch) -> None:
+    captured_kwargs: dict = {}
+
+    class FakeMessages:
+        async def create(self, **kwargs):
+            captured_kwargs.update(kwargs)
+            return SimpleNamespace(
+                content=[SimpleNamespace(type="text", text="ok")],
+                usage=None,
+                stop_reason="stop",
+            )
+
+    class FakeClient:
+        messages = FakeMessages()
+
+    monkeypatch.setattr(AnthropicProvider, "_client_or_raise", lambda self: FakeClient())
+
+    async def run_case():
+        provider = AnthropicProvider(default_model="claude-sonnet-4-5")
+        return await provider.chat(messages=[{"role": "user", "content": "hi"}], max_tokens=None)
+
+    response = asyncio.run(run_case())
+
+    assert response.content == "ok"
+    assert captured_kwargs["max_tokens"] == 64_000
--- a/app-instance/backend/tests/unit/test_process_projection.py
+++ b/app-instance/backend/tests/unit/test_process_projection.py
@ -5,6 +5,7 @@ from pathlib import Path
 from beaver.engine.session import SessionManager
 from beaver.memory.runs import RunMemoryStore, RunRecord
 from beaver.services.process_service import SessionProcessProjector
+from beaver.skills.specs import SkillActivationReceipt


 def test_process_projection_maps_task_team_events(tmp_path: Path) -> None:
@ -238,6 +239,130 @@ def test_process_projection_uses_normalized_plan_metadata_defaults(tmp_path: Pat
    assert planned_event["metadata"]["strategy"] == "single"


+def test_process_projection_emits_skill_card_from_main_run_receipts(tmp_path: Path) -> None:
+    session = SessionManager(tmp_path)
+    run_store = RunMemoryStore(tmp_path / "memory" / "runs")
+    run_store.append_run_record(
+        RunRecord(
+            run_id="main-run",
+            session_id="web:test",
+            task_id="task-1",
+            attempt_index=1,
+            task_text="main task",
+            started_at="2026-01-01T00:00:03+00:00",
+            ended_at="2026-01-01T00:00:04+00:00",
+            success=True,
+            finish_reason="stop",
+            activated_skills=[
+                SkillActivationReceipt(
+                    run_id="main-run",
+                    session_id="web:test",
+                    skill_name="web-operation",
+                    skill_version="1",
+                    content_hash="hash",
+                    activated_at="2026-01-01T00:00:03+00:00",
+                    activation_reason="Needs live web lookup.",
+                )
+            ],
+        )
+    )
+    session.append_message(
+        "web:test",
+        role="system",
+        event_type="task_execution_planned",
+        event_payload={
+            "task_id": "task-1",
+            "attempt_index": 1,
+            "plan_mode": "single",
+            "strategy": "single",
+            "selected_skill_names": [],
+        },
+        context_visible=False,
+    )
+    session.append_message(
+        "web:test",
+        role="system",
+        event_type="task_synthesis_completed",
+        event_payload={"task_id": "task-1", "attempt_index": 1, "main_run_id": "main-run"},
+        context_visible=False,
+    )
+
+    projection = SessionProcessProjector(session, run_store).project("web:test")
+
+    skill_events = [
+        event
+        for event in projection["events"]
+        if event["kind"] == "skill_selected" and event["run_id"] == "main-run"
+    ]
+    assert skill_events
+    assert skill_events[0]["metadata"]["timeline_type"] == "skill"
+    assert skill_events[0]["metadata"]["skill_names"] == ["web-operation"]
+
+
+def test_process_projection_emits_tool_cards_from_run_messages(tmp_path: Path) -> None:
+    session = SessionManager(tmp_path)
+    run_store = RunMemoryStore(tmp_path / "memory" / "runs")
+    run_store.append_run_record(
+        RunRecord(
+            run_id="main-run",
+            session_id="web:test",
+            task_id="task-1",
+            attempt_index=1,
+            task_text="main task",
+            started_at="2026-01-01T00:00:03+00:00",
+            ended_at="2026-01-01T00:00:04+00:00",
+            success=True,
+            finish_reason="stop",
+        )
+    )
+    session.append_message(
+        "web:test",
+        role="system",
+        event_type="task_execution_planned",
+        event_payload={"task_id": "task-1", "attempt_index": 1},
+        context_visible=False,
+    )
+    session.append_message(
+        "web:test",
+        run_id="main-run",
+        role="assistant",
+        event_type="assistant_message_added",
+        event_payload={"task_id": "task-1"},
+        content="Searching",
+        tool_calls=[
+            {
+                "id": "call-1",
+                "name": "multi_search",
+                "arguments": {"query": "Macau cafe near Bóvia"},
+            }
+        ],
+        context_visible=False,
+    )
+    session.append_message(
+        "web:test",
+        run_id="main-run",
+        role="tool",
+        event_type="tool_result_recorded",
+        event_payload={"success": True, "error": None},
+        content="Found 3 restaurants",
+        tool_name="multi_search",
+        tool_call_id="call-1",
+        context_visible=True,
+    )
+
+    projection = SessionProcessProjector(session, run_store).project("web:test")
+
+    tool_call = next(event for event in projection["events"] if event["kind"] == "tool_call_started")
+    assert tool_call["metadata"]["timeline_type"] == "tool_call"
+    assert tool_call["metadata"]["tool_name"] == "multi_search"
+    assert tool_call["run_id"] == "main-run"
+
+    tool_result = next(event for event in projection["events"] if event["kind"] == "tool_call_finished")
+    assert tool_result["metadata"]["timeline_type"] == "tool_result"
+    assert tool_result["metadata"]["tool_name"] == "multi_search"
+    assert tool_result["metadata"]["success"] is True
+
+
 def test_process_projection_exposes_ephemeral_guidance_artifacts(tmp_path: Path) -> None:
    session = SessionManager(tmp_path)
    run_store = RunMemoryStore(tmp_path / "memory" / "runs")
--- a/app-instance/backend/tests/unit/test_web_tools.py
+++ b/app-instance/backend/tests/unit/test_web_tools.py
@ -0,0 +1,44 @@
+from __future__ import annotations
+
+import asyncio
+
+from beaver.tools.builtins import web
+
+
+class _FakeResponse:
+    headers = {"content-type": "text/html"}
+    status_code = 200
+    text = '<a class="result__a" href="https://example.com">Example</a>'
+    url = "https://example.com"
+
+    def raise_for_status(self) -> None:
+        return None
+
+
+class _FakeAsyncClient:
+    calls: list[dict[str, object]] = []
+
+    def __init__(self, **kwargs: object) -> None:
+        self.calls.append(kwargs)
+
+    async def __aenter__(self) -> "_FakeAsyncClient":
+        return self
+
+    async def __aexit__(self, *args: object) -> None:
+        return None
+
+    async def get(self, *args: object, **kwargs: object) -> _FakeResponse:
+        return _FakeResponse()
+
+
+def test_web_tools_use_environment_proxy_settings(monkeypatch) -> None:
+    _FakeAsyncClient.calls = []
+    monkeypatch.setattr(web.httpx, "AsyncClient", _FakeAsyncClient)
+
+    async def _run() -> None:
+        await web.WebFetchTool().execute(url="https://example.com")
+        await web.WebSearchTool().execute(query="example")
+
+    asyncio.run(_run())
+
+    assert [call.get("trust_env") for call in _FakeAsyncClient.calls] == [True, True]