Now we have server tool and client tool
This commit is contained in:
@@ -22,6 +22,7 @@ from loguru import logger
|
||||
from app.config import settings
|
||||
from core.conversation import ConversationManager, ConversationState
|
||||
from core.events import get_event_bus
|
||||
from core.tool_executor import execute_server_tool
|
||||
from core.transports import BaseTransport
|
||||
from models.ws_v1 import ev
|
||||
from processors.eou import EouDetector
|
||||
@@ -214,6 +215,7 @@ class DuplexPipeline:
|
||||
self._runtime_knowledge: Dict[str, Any] = {}
|
||||
self._runtime_knowledge_base_id: Optional[str] = None
|
||||
self._runtime_tools: List[Any] = []
|
||||
self._runtime_tool_executor: Dict[str, str] = {}
|
||||
self._pending_tool_waiters: Dict[str, asyncio.Future] = {}
|
||||
self._early_tool_results: Dict[str, Dict[str, Any]] = {}
|
||||
self._completed_tool_call_ids: set[str] = set()
|
||||
@@ -270,6 +272,10 @@ class DuplexPipeline:
|
||||
tools_payload = metadata.get("tools")
|
||||
if isinstance(tools_payload, list):
|
||||
self._runtime_tools = tools_payload
|
||||
self._runtime_tool_executor = self._resolved_tool_executor_map()
|
||||
elif "tools" in metadata:
|
||||
self._runtime_tools = []
|
||||
self._runtime_tool_executor = {}
|
||||
|
||||
if self.llm_service and hasattr(self.llm_service, "set_knowledge_config"):
|
||||
self.llm_service.set_knowledge_config(self._resolved_knowledge_config())
|
||||
@@ -675,6 +681,10 @@ class DuplexPipeline:
|
||||
|
||||
fn = item.get("function")
|
||||
if isinstance(fn, dict) and fn.get("name"):
|
||||
fn_name = str(fn.get("name"))
|
||||
executor = str(item.get("executor") or item.get("run_on") or "").strip().lower()
|
||||
if executor in {"client", "server"}:
|
||||
self._runtime_tool_executor[fn_name] = executor
|
||||
schemas.append(
|
||||
{
|
||||
"type": "function",
|
||||
@@ -688,6 +698,10 @@ class DuplexPipeline:
|
||||
continue
|
||||
|
||||
if item.get("name"):
|
||||
fn_name = str(item.get("name"))
|
||||
executor = str(item.get("executor") or item.get("run_on") or "").strip().lower()
|
||||
if executor in {"client", "server"}:
|
||||
self._runtime_tool_executor[fn_name] = executor
|
||||
schemas.append(
|
||||
{
|
||||
"type": "function",
|
||||
@@ -700,6 +714,49 @@ class DuplexPipeline:
|
||||
)
|
||||
return schemas
|
||||
|
||||
def _resolved_tool_executor_map(self) -> Dict[str, str]:
|
||||
result: Dict[str, str] = {}
|
||||
for item in self._runtime_tools:
|
||||
if not isinstance(item, dict):
|
||||
continue
|
||||
fn = item.get("function")
|
||||
if isinstance(fn, dict) and fn.get("name"):
|
||||
name = str(fn.get("name"))
|
||||
else:
|
||||
name = str(item.get("name") or "").strip()
|
||||
if not name:
|
||||
continue
|
||||
executor = str(item.get("executor") or item.get("run_on") or "").strip().lower()
|
||||
if executor in {"client", "server"}:
|
||||
result[name] = executor
|
||||
return result
|
||||
|
||||
def _tool_name(self, tool_call: Dict[str, Any]) -> str:
|
||||
fn = tool_call.get("function")
|
||||
if isinstance(fn, dict):
|
||||
return str(fn.get("name") or "").strip()
|
||||
return ""
|
||||
|
||||
def _tool_executor(self, tool_call: Dict[str, Any]) -> str:
|
||||
name = self._tool_name(tool_call)
|
||||
if name and name in self._runtime_tool_executor:
|
||||
return self._runtime_tool_executor[name]
|
||||
# Default to server execution unless explicitly marked as client.
|
||||
return "server"
|
||||
|
||||
async def _emit_tool_result(self, result: Dict[str, Any], source: str) -> None:
|
||||
await self._send_event(
|
||||
{
|
||||
**ev(
|
||||
"assistant.tool_result",
|
||||
trackId=self.session_id,
|
||||
source=source,
|
||||
result=result,
|
||||
)
|
||||
},
|
||||
priority=22,
|
||||
)
|
||||
|
||||
async def handle_tool_call_results(self, results: List[Dict[str, Any]]) -> None:
|
||||
"""Handle client tool execution results."""
|
||||
if not isinstance(results, list):
|
||||
@@ -807,13 +864,16 @@ class DuplexPipeline:
|
||||
if not tool_call:
|
||||
continue
|
||||
allow_text_output = False
|
||||
tool_calls.append(tool_call)
|
||||
executor = self._tool_executor(tool_call)
|
||||
enriched_tool_call = dict(tool_call)
|
||||
enriched_tool_call["executor"] = executor
|
||||
tool_calls.append(enriched_tool_call)
|
||||
await self._send_event(
|
||||
{
|
||||
**ev(
|
||||
"assistant.tool_call",
|
||||
trackId=self.session_id,
|
||||
tool_call=tool_call,
|
||||
tool_call=enriched_tool_call,
|
||||
)
|
||||
},
|
||||
priority=22,
|
||||
@@ -917,7 +977,16 @@ class DuplexPipeline:
|
||||
call_id = str(call.get("id") or "").strip()
|
||||
if not call_id:
|
||||
continue
|
||||
tool_results.append(await self._wait_for_single_tool_result(call_id))
|
||||
executor = str(call.get("executor") or "server").strip().lower()
|
||||
if executor == "client":
|
||||
result = await self._wait_for_single_tool_result(call_id)
|
||||
await self._emit_tool_result(result, source="client")
|
||||
tool_results.append(result)
|
||||
continue
|
||||
|
||||
result = await execute_server_tool(call)
|
||||
await self._emit_tool_result(result, source="server")
|
||||
tool_results.append(result)
|
||||
|
||||
messages = [
|
||||
*messages,
|
||||
@@ -928,7 +997,7 @@ class DuplexPipeline:
|
||||
LLMMessage(
|
||||
role="system",
|
||||
content=(
|
||||
"Tool execution results were returned by the client. "
|
||||
"Tool execution results are available. "
|
||||
"Continue answering the user naturally using these results. "
|
||||
"Do not request the same tool again in this turn.\n"
|
||||
f"tool_calls={json.dumps(tool_calls, ensure_ascii=False)}\n"
|
||||
|
||||
118
engine/core/tool_executor.py
Normal file
118
engine/core/tool_executor.py
Normal file
@@ -0,0 +1,118 @@
|
||||
"""Server-side tool execution helpers."""
|
||||
|
||||
import ast
|
||||
import operator
|
||||
from typing import Any, Dict
|
||||
|
||||
|
||||
_BIN_OPS = {
|
||||
ast.Add: operator.add,
|
||||
ast.Sub: operator.sub,
|
||||
ast.Mult: operator.mul,
|
||||
ast.Div: operator.truediv,
|
||||
ast.Mod: operator.mod,
|
||||
}
|
||||
|
||||
_UNARY_OPS = {
|
||||
ast.UAdd: operator.pos,
|
||||
ast.USub: operator.neg,
|
||||
}
|
||||
|
||||
|
||||
def _safe_eval_expr(expression: str) -> float:
|
||||
tree = ast.parse(expression, mode="eval")
|
||||
|
||||
def _eval(node: ast.AST) -> float:
|
||||
if isinstance(node, ast.Expression):
|
||||
return _eval(node.body)
|
||||
if isinstance(node, ast.Constant) and isinstance(node.value, (int, float)):
|
||||
return float(node.value)
|
||||
if isinstance(node, ast.BinOp):
|
||||
op = _BIN_OPS.get(type(node.op))
|
||||
if not op:
|
||||
raise ValueError("unsupported operator")
|
||||
return float(op(_eval(node.left), _eval(node.right)))
|
||||
if isinstance(node, ast.UnaryOp):
|
||||
op = _UNARY_OPS.get(type(node.op))
|
||||
if not op:
|
||||
raise ValueError("unsupported unary operator")
|
||||
return float(op(_eval(node.operand)))
|
||||
raise ValueError("unsupported expression")
|
||||
|
||||
return _eval(tree)
|
||||
|
||||
|
||||
def _extract_tool_name(tool_call: Dict[str, Any]) -> str:
|
||||
function_payload = tool_call.get("function")
|
||||
if isinstance(function_payload, dict):
|
||||
return str(function_payload.get("name") or "").strip()
|
||||
return ""
|
||||
|
||||
|
||||
def _extract_tool_args(tool_call: Dict[str, Any]) -> Dict[str, Any]:
|
||||
function_payload = tool_call.get("function")
|
||||
if not isinstance(function_payload, dict):
|
||||
return {}
|
||||
raw = function_payload.get("arguments")
|
||||
if isinstance(raw, dict):
|
||||
return raw
|
||||
if not isinstance(raw, str):
|
||||
return {}
|
||||
text = raw.strip()
|
||||
if not text:
|
||||
return {}
|
||||
try:
|
||||
import json
|
||||
|
||||
parsed = json.loads(text)
|
||||
return parsed if isinstance(parsed, dict) else {}
|
||||
except Exception:
|
||||
return {}
|
||||
|
||||
|
||||
async def execute_server_tool(tool_call: Dict[str, Any]) -> Dict[str, Any]:
|
||||
"""Execute a server-side tool and return normalized result payload."""
|
||||
call_id = str(tool_call.get("id") or "").strip()
|
||||
tool_name = _extract_tool_name(tool_call)
|
||||
args = _extract_tool_args(tool_call)
|
||||
|
||||
if tool_name == "calculator":
|
||||
expression = str(args.get("expression") or "").strip()
|
||||
if not expression:
|
||||
return {
|
||||
"tool_call_id": call_id,
|
||||
"name": tool_name,
|
||||
"output": {"error": "missing expression"},
|
||||
"status": {"code": 400, "message": "bad_request"},
|
||||
}
|
||||
if len(expression) > 200:
|
||||
return {
|
||||
"tool_call_id": call_id,
|
||||
"name": tool_name,
|
||||
"output": {"expression": expression, "error": "expression too long"},
|
||||
"status": {"code": 422, "message": "invalid_expression"},
|
||||
}
|
||||
try:
|
||||
value = _safe_eval_expr(expression)
|
||||
if value.is_integer():
|
||||
value = int(value)
|
||||
return {
|
||||
"tool_call_id": call_id,
|
||||
"name": tool_name,
|
||||
"output": {"expression": expression, "result": value},
|
||||
"status": {"code": 200, "message": "ok"},
|
||||
}
|
||||
except Exception as exc:
|
||||
return {
|
||||
"tool_call_id": call_id,
|
||||
"name": tool_name,
|
||||
"output": {"expression": expression, "error": str(exc)},
|
||||
"status": {"code": 422, "message": "invalid_expression"},
|
||||
}
|
||||
|
||||
return {
|
||||
"tool_call_id": call_id,
|
||||
"name": tool_name or "unknown_tool",
|
||||
"output": {"message": "server tool not implemented"},
|
||||
"status": {"code": 501, "message": "not_implemented"},
|
||||
}
|
||||
@@ -161,7 +161,9 @@ Common events:
|
||||
- `assistant.response.final`
|
||||
- Fields: `trackId`, `text`
|
||||
- `assistant.tool_call`
|
||||
- Fields: `trackId`, `tool_call`
|
||||
- Fields: `trackId`, `tool_call` (`tool_call.executor` is `client` or `server`)
|
||||
- `assistant.tool_result`
|
||||
- Fields: `trackId`, `source`, `result`
|
||||
- `output.audio.start`
|
||||
- Fields: `trackId`
|
||||
- `output.audio.end`
|
||||
|
||||
@@ -136,6 +136,7 @@ async def test_turn_with_tool_call_then_results(monkeypatch):
|
||||
type="tool_call",
|
||||
tool_call={
|
||||
"id": "call_ok",
|
||||
"executor": "client",
|
||||
"type": "function",
|
||||
"function": {"name": "weather", "arguments": "{\"city\":\"hz\"}"},
|
||||
},
|
||||
@@ -183,6 +184,7 @@ async def test_turn_with_tool_call_timeout(monkeypatch):
|
||||
type="tool_call",
|
||||
tool_call={
|
||||
"id": "call_timeout",
|
||||
"executor": "client",
|
||||
"type": "function",
|
||||
"function": {"name": "search", "arguments": "{\"query\":\"x\"}"},
|
||||
},
|
||||
@@ -217,3 +219,36 @@ async def test_duplicate_tool_results_are_ignored(monkeypatch):
|
||||
result = await pipeline._wait_for_single_tool_result("call_dup")
|
||||
|
||||
assert result.get("output", {}).get("value") == 1
|
||||
|
||||
|
||||
@pytest.mark.asyncio
|
||||
async def test_server_calculator_emits_tool_result(monkeypatch):
|
||||
pipeline, events = _build_pipeline(
|
||||
monkeypatch,
|
||||
[
|
||||
[
|
||||
LLMStreamEvent(
|
||||
type="tool_call",
|
||||
tool_call={
|
||||
"id": "call_calc",
|
||||
"executor": "server",
|
||||
"type": "function",
|
||||
"function": {"name": "calculator", "arguments": "{\"expression\":\"1+2\"}"},
|
||||
},
|
||||
),
|
||||
LLMStreamEvent(type="done"),
|
||||
],
|
||||
[
|
||||
LLMStreamEvent(type="text_delta", text="done."),
|
||||
LLMStreamEvent(type="done"),
|
||||
],
|
||||
],
|
||||
)
|
||||
|
||||
await pipeline._handle_turn("calc")
|
||||
|
||||
tool_results = [e for e in events if e.get("type") == "assistant.tool_result"]
|
||||
assert tool_results
|
||||
payload = tool_results[-1].get("result", {})
|
||||
assert payload.get("status", {}).get("code") == 200
|
||||
assert payload.get("output", {}).get("result") == 3
|
||||
|
||||
@@ -1000,37 +1000,6 @@ const TOOL_PARAMETER_HINTS: Record<string, any> = {
|
||||
const getDefaultToolParameters = (toolId: string) =>
|
||||
TOOL_PARAMETER_HINTS[toolId] || { type: 'object', properties: {} };
|
||||
|
||||
const parseToolArgs = (raw: unknown): Record<string, any> => {
|
||||
if (raw && typeof raw === 'object') return raw as Record<string, any>;
|
||||
if (typeof raw !== 'string') return {};
|
||||
const text = raw.trim();
|
||||
if (!text) return {};
|
||||
try {
|
||||
const parsed = JSON.parse(text);
|
||||
return parsed && typeof parsed === 'object' ? parsed : {};
|
||||
} catch {
|
||||
return {};
|
||||
}
|
||||
};
|
||||
|
||||
const evaluateCalculatorExpression = (expression: string): { ok: true; result: number } | { ok: false; error: string } => {
|
||||
const expr = String(expression || '').trim();
|
||||
if (!expr) return { ok: false, error: 'empty expression' };
|
||||
if (expr.length > 200) return { ok: false, error: 'expression too long' };
|
||||
if (!/^[0-9+\-*/().%\s]+$/.test(expr)) return { ok: false, error: 'invalid characters' };
|
||||
if (expr.includes('**') || expr.includes('//')) return { ok: false, error: 'unsupported operator' };
|
||||
|
||||
try {
|
||||
const value = Function(`"use strict"; return (${expr});`)();
|
||||
if (typeof value !== 'number' || !Number.isFinite(value)) {
|
||||
return { ok: false, error: 'expression is not finite number' };
|
||||
}
|
||||
return { ok: true, result: value };
|
||||
} catch {
|
||||
return { ok: false, error: 'invalid expression' };
|
||||
}
|
||||
};
|
||||
|
||||
// Stable transcription log so the scroll container is not recreated on every render (avoids scroll jumping)
|
||||
const TranscriptionLog: React.FC<{
|
||||
scrollRef: React.RefObject<HTMLDivElement | null>;
|
||||
@@ -1165,12 +1134,18 @@ export const DebugDrawer: React.FC<{
|
||||
const byId = new Map(tools.map((t) => [t.id, t]));
|
||||
return ids.map((id) => {
|
||||
const item = byId.get(id);
|
||||
const toolId = item?.id || id;
|
||||
const isClientTool =
|
||||
toolId.startsWith('client_') ||
|
||||
toolId.startsWith('browser_') ||
|
||||
['camera', 'microphone', 'page_control', 'local_file'].includes(toolId);
|
||||
return {
|
||||
type: 'function',
|
||||
executor: isClientTool ? 'client' : 'server',
|
||||
function: {
|
||||
name: item?.id || id,
|
||||
name: toolId,
|
||||
description: item?.description || item?.name || id,
|
||||
parameters: getDefaultToolParameters(item?.id || id),
|
||||
parameters: getDefaultToolParameters(toolId),
|
||||
},
|
||||
};
|
||||
});
|
||||
@@ -1760,64 +1735,25 @@ export const DebugDrawer: React.FC<{
|
||||
const toolCall = payload?.tool_call || {};
|
||||
const toolCallId = String(toolCall?.id || '').trim();
|
||||
const toolName = String(toolCall?.function?.name || toolCall?.name || 'unknown_tool');
|
||||
const executor = String(toolCall?.executor || 'server').toLowerCase();
|
||||
const rawArgs = String(toolCall?.function?.arguments || '');
|
||||
const argText = rawArgs.length > 160 ? `${rawArgs.slice(0, 160)}...` : rawArgs;
|
||||
setMessages((prev) => [
|
||||
...prev,
|
||||
{
|
||||
role: 'tool',
|
||||
text: `call ${toolName}${argText ? ` args=${argText}` : ''}`,
|
||||
text: `call ${toolName} executor=${executor}${argText ? ` args=${argText}` : ''}`,
|
||||
},
|
||||
]);
|
||||
if (toolCallId && ws.readyState === WebSocket.OPEN) {
|
||||
const argsObj = parseToolArgs(toolCall?.function?.arguments);
|
||||
const normalizedToolName = toolName.trim().toLowerCase();
|
||||
let resultPayload: any = {
|
||||
if (executor === 'client' && toolCallId && ws.readyState === WebSocket.OPEN) {
|
||||
const resultPayload: any = {
|
||||
tool_call_id: toolCallId,
|
||||
name: toolName,
|
||||
output: {
|
||||
message: 'Tool execution is not implemented in debug web client',
|
||||
message: 'Client tool execution is not implemented in debug web client',
|
||||
},
|
||||
status: { code: 501, message: 'not_implemented' },
|
||||
};
|
||||
|
||||
const isCalculatorTool =
|
||||
normalizedToolName === 'calculator' ||
|
||||
normalizedToolName.endsWith('.calculator') ||
|
||||
normalizedToolName.includes('calculator');
|
||||
|
||||
if (isCalculatorTool) {
|
||||
const expression = String(argsObj.expression || argsObj.input || '').trim();
|
||||
if (!expression) {
|
||||
resultPayload = {
|
||||
tool_call_id: toolCallId,
|
||||
name: toolName,
|
||||
output: { error: 'missing expression' },
|
||||
status: { code: 400, message: 'bad_request' },
|
||||
};
|
||||
} else {
|
||||
const calc = evaluateCalculatorExpression(expression);
|
||||
if (calc.ok) {
|
||||
resultPayload = {
|
||||
tool_call_id: toolCallId,
|
||||
name: toolName,
|
||||
output: {
|
||||
expression,
|
||||
result: calc.result,
|
||||
},
|
||||
status: { code: 200, message: 'ok' },
|
||||
};
|
||||
} else {
|
||||
resultPayload = {
|
||||
tool_call_id: toolCallId,
|
||||
name: toolName,
|
||||
output: { expression, error: calc.error },
|
||||
status: { code: 422, message: 'invalid_expression' },
|
||||
};
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
ws.send(
|
||||
JSON.stringify({
|
||||
type: 'tool_call.results',
|
||||
@@ -1841,6 +1777,21 @@ export const DebugDrawer: React.FC<{
|
||||
return;
|
||||
}
|
||||
|
||||
if (type === 'assistant.tool_result') {
|
||||
const result = payload?.result || {};
|
||||
const toolName = String(result?.name || 'unknown_tool');
|
||||
const statusCode = Number(result?.status?.code || 500);
|
||||
const statusMessage = String(result?.status?.message || 'error');
|
||||
const source = String(payload?.source || 'server');
|
||||
const output = result?.output;
|
||||
const resultText =
|
||||
statusCode === 200
|
||||
? `result ${toolName} source=${source} ${JSON.stringify(output)}`
|
||||
: `result ${toolName} source=${source} status=${statusCode} ${statusMessage}`;
|
||||
setMessages((prev) => [...prev, { role: 'tool', text: resultText }]);
|
||||
return;
|
||||
}
|
||||
|
||||
if (type === 'session.started') {
|
||||
wsReadyRef.current = true;
|
||||
setWsStatus('ready');
|
||||
|
||||
Reference in New Issue
Block a user