feat(engine): 添加技能查看工具并优化异步任务管理 - 添加SkillViewTool到引擎加载器中,增强技能管理功能 - 在AgentLoop中引入_active_direct_task来跟踪活跃任务 - 实现直接任务执行时的同步处理逻辑 - 更新工具实例化方式以支持依赖注入 feat(config): 增加智能体运行时参数配置支持 - 扩展AgentDefaultsConfig添加max_tokens和temperature字段 - 实现配置解析函数_first_config_value处理多个配置源 - 支持通过Web API动态更新智能体运行时参数 - 添加前端页面配置表单和验证逻辑 refactor(provider): 统一最大令牌数参数类型为可选整型 - 将所有LLM提供者的max_tokens参数改为int | None类型 - 为AnthropicProvider实现模型特定的最大令牌数默认值 - 调整参数传递逻辑,优先级:调用参数 > 配置文件 > 模型默认值 - 移除硬编码的默认值,改用条件判断 feat(process): 增强事件投影功能 - 添加工具调用开始/结束事件的映射逻辑 - 实现技能激活事件的识别和展示 - 添加辅助函数处理工具调用名称和参数提取 - 优化运行记录关联逻辑,提升事件匹配准确性 fix(web): 更新网络请求客户端信任环境设置 - 将WebFetchTool和WebSearchTool的trust_env参数设为True - 确保HTTP客户端能够正确使用系统代理配置 - 修复可能的网络连接问题 test: 添加配置加载和事件投影相关测试 - 新增智能体默认参数配置测试用例 - 实现API配置持久化和重载测试 - 添加技能卡片和工具事件的投影测试 ```
109 lines
3.8 KiB
Python
109 lines
3.8 KiB
Python
"""Direct OpenAI-compatible provider — bypasses LiteLLM."""
|
|
|
|
from __future__ import annotations
|
|
|
|
from typing import Any
|
|
|
|
from .base import LLMProvider, LLMResponse, ToolCallRequest
|
|
|
|
try: # pragma: no cover - optional dependency
|
|
import json_repair
|
|
except ModuleNotFoundError: # pragma: no cover
|
|
json_repair = None # type: ignore[assignment]
|
|
|
|
try: # pragma: no cover - optional dependency
|
|
from openai import AsyncOpenAI
|
|
except ModuleNotFoundError: # pragma: no cover
|
|
AsyncOpenAI = None # type: ignore[assignment]
|
|
|
|
|
|
class CustomProvider(LLMProvider):
|
|
"""直接连接任意 OpenAI-compatible endpoint。"""
|
|
|
|
def __init__(
|
|
self,
|
|
api_key: str = "no-key",
|
|
api_base: str = "http://localhost:8000/v1",
|
|
default_model: str = "default",
|
|
request_timeout_seconds: float | None = None,
|
|
) -> None:
|
|
super().__init__(api_key, api_base, request_timeout_seconds=request_timeout_seconds)
|
|
self.default_model = default_model
|
|
self._client = None
|
|
|
|
def _client_or_raise(self):
|
|
if AsyncOpenAI is None:
|
|
raise RuntimeError("openai package is not installed")
|
|
if self._client is None:
|
|
self._client = AsyncOpenAI(
|
|
api_key=self.api_key,
|
|
base_url=self.api_base,
|
|
timeout=self.request_timeout_seconds,
|
|
)
|
|
return self._client
|
|
|
|
async def chat(
|
|
self,
|
|
messages: list[dict[str, Any]],
|
|
tools: list[dict[str, Any]] | None = None,
|
|
model: str | None = None,
|
|
max_tokens: int | None = None,
|
|
temperature: float = 0.7,
|
|
thinking_enabled: bool | None = None,
|
|
) -> LLMResponse:
|
|
client = self._client_or_raise()
|
|
kwargs: dict[str, Any] = {
|
|
"model": model or self.default_model,
|
|
"messages": self.sanitize_empty_content(messages),
|
|
"temperature": temperature,
|
|
}
|
|
if max_tokens is not None:
|
|
kwargs["max_tokens"] = max(1, max_tokens)
|
|
if tools:
|
|
kwargs.update(tools=tools, tool_choice="auto")
|
|
try:
|
|
response = await client.chat.completions.create(**kwargs)
|
|
except Exception as exc:
|
|
return LLMResponse(content=f"Error: {exc}", finish_reason="error", provider_name="custom")
|
|
|
|
choice = response.choices[0]
|
|
message = choice.message
|
|
parsed_tool_calls: list[ToolCallRequest] = []
|
|
for tool_call in message.tool_calls or []:
|
|
raw_arguments = tool_call.function.arguments
|
|
if isinstance(raw_arguments, str):
|
|
if json_repair is not None:
|
|
arguments = json_repair.loads(raw_arguments)
|
|
else:
|
|
import json
|
|
arguments = json.loads(raw_arguments)
|
|
else:
|
|
arguments = raw_arguments
|
|
parsed_tool_calls.append(
|
|
ToolCallRequest(
|
|
id=tool_call.id,
|
|
name=tool_call.function.name,
|
|
arguments=arguments,
|
|
)
|
|
)
|
|
usage = getattr(response, "usage", None)
|
|
usage_payload = {}
|
|
if usage is not None:
|
|
usage_payload = {
|
|
"prompt_tokens": getattr(usage, "prompt_tokens", 0),
|
|
"completion_tokens": getattr(usage, "completion_tokens", 0),
|
|
"total_tokens": getattr(usage, "total_tokens", 0),
|
|
}
|
|
return LLMResponse(
|
|
content=message.content,
|
|
tool_calls=parsed_tool_calls,
|
|
finish_reason=choice.finish_reason or "stop",
|
|
usage=usage_payload,
|
|
reasoning_content=getattr(message, "reasoning_content", None),
|
|
provider_name="custom",
|
|
model=model or self.default_model,
|
|
)
|
|
|
|
def get_default_model(self) -> str:
|
|
return self.default_model
|