添加 DEFAULT_TEAM_NODE_MAX_TOOL_ITERATIONS 配置项以控制团队节点的最大工具迭代次数, 并修改 LocalAgentRunner 中的逻辑来使用此默认值当 envelope 中未指定时。 fix(runtime): 修复团队节点运行成功判断逻辑 更新运行成功判断条件,将 finish_reason 为 "max_tool_iterations_finalized" 的情况 视为运行失败,并添加对原始工具调用输出的检测,避免将其误判为成功完成。 feat(mcp): 添加团队工作流MCP工具类别支持 增加新的本地MCP工具类别 "team_workflow" 及其对应的工具创建功能, 为团队工作流提供本地工具支持。 refactor(engine): 调整AgentLoop最大工具迭代次数设置 将 AgentProfile 中的默认 max_tool_iterations 从 30 增加到 100, 同时移除 TaskExecutionPlanner 构造函数中的重复参数传递。 perf(mcp): 优化MCP连接管理避免重复连接 添加 mcp_connected 标志来跟踪MCP连接状态,确保 connect_all 只执行一次, 提高性能并避免不必要的重复连接。 refactor(skills): 移除技能团队模板相关功能 移除与技能团队模板相关的代码,包括解析、存储和处理逻辑, 简化技能记录结构和加载流程。 feat(process): 增强会话过程投影器功能 添加技能激活快照事件处理,改进团队运行完成消息显示, 并增强技能激活事件的时间戳记录功能。 refactor(tasks): 简化任务尝试编排器团队执行逻辑 移除团队执行相关代码,将所有任务统一按单步执行处理, 简化任务编排器的复杂度并提升执行效率。 fix(evidence): 修复节点证据评估中需求验证逻辑 更新节点证据评估逻辑,跳过自然语言证据需求的确定性验证, 只执行机器可读的需求验证,避免因自然语言需求导致的节点失败。
121 lines
3.6 KiB
Python
121 lines
3.6 KiB
Python
from __future__ import annotations
|
|
|
|
import asyncio
|
|
from types import SimpleNamespace
|
|
from typing import Any
|
|
|
|
from beaver.coordinator import AgentDescriptor, ExecutionGraph, ExecutionNode
|
|
from beaver.engine import AgentRunResult
|
|
from beaver.tasks import TaskExecutionPlan, TaskRecord
|
|
from beaver.tasks.attempt_orchestrator import TaskAttemptOrchestrator
|
|
|
|
|
|
class FakeTaskService:
    """Minimal task-service stand-in used by the orchestrator tests.

    The instance is handed to ``TaskAttemptOrchestrator`` through the
    ``loaded.task_service`` attribute. It records nothing; it only returns
    canned values.

    Args:
        task: Optional record returned by :meth:`append_run`. Tests may also
            assign ``.task`` after construction.
    """

    def __init__(self, task: TaskRecord | None = None) -> None:
        # Declare the attribute up front so the fake never depends on an
        # attribute that exists only if a test remembered to assign it.
        self.task: TaskRecord | None = task

    def start_run(self, task_id: str, **_: Any) -> None:
        """Accept a run-start notification and ignore it."""
        return None

    def append_run(self, task_id: str, run_id: str, **_: Any) -> TaskRecord:
        """Return the configured task record, ignoring all arguments.

        Raises:
            AttributeError: If no task was configured. This is the same
                exception type an undeclared attribute would have produced,
                but with a message that names the missing setup step.
        """
        if self.task is None:
            raise AttributeError(
                "FakeTaskService.task must be set before append_run is called"
            )
        return self.task
|
|
|
|
|
|
class FakeSessionManager:
    """In-memory session-manager double that captures appended messages.

    Each ``append_message`` call is stored in ``events`` as a dict whose
    first key is ``"session_id"``, followed by the keyword arguments given.
    """

    def __init__(self) -> None:
        # Captured messages, in call order.
        self.events: list[dict[str, Any]] = []

    def append_message(self, session_id: str, **kwargs: Any) -> None:
        """Store one message record built from the session id and kwargs."""
        record: dict[str, Any] = {"session_id": session_id}
        record.update(kwargs)
        self.events.append(record)

    def update_latest_assistant_event_payload(self, *args: Any, **kwargs: Any) -> None:
        """Accept any arguments and do nothing."""
        return None

    def get_run_event_records(self, session_id: str, run_id: str) -> list[Any]:
        """Report that no event records exist for the given run."""
        return list()
|
|
|
|
|
|
class LegacyTeamPlanner:
    """Planner double that always proposes a one-node ``"team"`` plan.

    The plan's ``reason`` states that the orchestrator is expected to ignore
    it; the test in this module checks that expectation.
    """

    async def plan(self, **_: Any) -> TaskExecutionPlan:
        """Return a team-mode plan with a single sequential ``collect`` node.

        All keyword arguments are accepted and ignored.
        """
        collect_node = ExecutionNode(
            "collect",
            "Collect",
            AgentDescriptor(name="collect"),
        )
        legacy_graph = ExecutionGraph(strategy="sequence", nodes=[collect_node])
        return TaskExecutionPlan(
            mode="team",
            reason="legacy plan should be ignored by orchestrator",
            graph=legacy_graph,
        )
|
|
|
|
|
|
def _task() -> TaskRecord:
    """Build the fixed ``TaskRecord`` fixture shared by the tests here.

    A new record, with a new ``constraints`` list, is created on every call.
    """
    fields: dict[str, Any] = {
        "task_id": "task-1",
        "session_id": "session-1",
        "description": "finance comparison",
        "goal": "finance comparison",
        "constraints": [],
        "priority": 0,
        "status": "open",
        "creator": "test",
        "created_at": "now",
        "updated_at": "now",
    }
    return TaskRecord(**fields)
|
|
|
|
|
|
def test_builtin_tools_do_not_export_legacy_agent_team_tool() -> None:
    """Check that ``beaver.tools.builtins`` no longer exposes ``AgentTeamTool``.

    The name must be absent both from the module's ``__all__`` and from its
    attributes.
    """
    import beaver.tools.builtins as builtin_tools

    legacy_name = "AgentTeamTool"
    exported_names = builtin_tools.__all__

    assert legacy_name not in exported_names
    assert not hasattr(builtin_tools, legacy_name)
|
|
|
|
|
|
def test_task_orchestrator_does_not_execute_legacy_planner_team_graph() -> None:
    """Check that a ``"team"`` plan from the planner is not executed as a team.

    The orchestrator is wired with ``LegacyTeamPlanner`` and its
    ``_run_team_for_task`` is replaced by a coroutine that fails the test if
    awaited. The run must return the single-path runner's output and record a
    ``task_synthesis_completed`` event whose ``task_outcome`` is ``"single"``.
    """
    record = _task()

    fake_tasks = FakeTaskService()
    fake_tasks.task = record
    fake_sessions = FakeSessionManager()

    orchestrator = TaskAttemptOrchestrator(
        loaded=SimpleNamespace(
            task_service=fake_tasks,
            task_execution_planner=LegacyTeamPlanner(),
            session_manager=fake_sessions,
            run_memory_store=None,
        ),
        create_loop=lambda: None,
        make_provider_bundle_for_task=lambda *_: None,
    )

    async def fail_if_called(*args: Any, **kwargs: Any) -> Any:
        # Fails the test if the team execution path is entered.
        raise AssertionError("legacy planner team graph must not start TeamService")

    async def runner(message: str, **kwargs: Any) -> AgentRunResult:
        # Canned single-step result; its output text is asserted below.
        return AgentRunResult(
            session_id="session-1",
            run_id="main-run",
            output_text="single path",
            finish_reason="stop",
            tool_iterations=0,
        )

    orchestrator._run_team_for_task = fail_if_called  # type: ignore[method-assign]

    run_kwargs = {
        "session_id": "session-1",
        "provider_bundle": SimpleNamespace(),
        "include_skill_assembly": False,
    }
    pending_run = orchestrator.run(
        message="compare finance",
        runner=runner,
        kwargs=run_kwargs,
        task=record,
    )
    result = asyncio.run(pending_run)

    assert result.output_text == "single path"

    synthesis_events = []
    for event in fake_sessions.events:
        if event.get("event_type") == "task_synthesis_completed":
            synthesis_events.append(event)
    assert synthesis_events[0]["event_payload"]["task_outcome"] == "single"
|