Files
ai-video-fullstack/backend/services/brains/fastgpt_llm.py
Xin Wang 809b634420 Enhance AssistantConfig and pipeline for FastGPT integration
- Add new fields in AssistantConfig for FastGPT connection details, including `fastgpt_api_url`, `fastgpt_api_key`, and `fastgpt_app_id`.
- Update the pipeline to utilize the new FastGPT configuration, ensuring proper integration with external services.
- Introduce type handling for different assistant types, including support for realtime modes and external brain management.
- Refactor frontend components to include hints for FastGPT configuration inputs, improving user guidance during setup.
2026-06-16 16:55:51 +08:00

162 lines
5.5 KiB
Python

"""FastGPT 作为 pipecat LLM 槽位。
与普通 LLM 的关键不同:context / 知识库 / 工具全在 FastGPT 服务端,靠 chatId
维持会话。所以本服务只发「最后一条 user 文本」+ 稳定 chatId,把流式 answer
事件转成 LLMTextFrame 交给下游 TTS;不消费/不依赖本地 LLMContext 的历史。
"""
from __future__ import annotations
from typing import Any
from fastgpt_client import AsyncChatClient, aiter_stream_events
from loguru import logger
from models import AssistantConfig
from pipecat.frames.frames import (
Frame,
LLMContextFrame,
LLMFullResponseEndFrame,
LLMFullResponseStartFrame,
LLMTextFrame,
)
from pipecat.processors.frame_processor import FrameDirection
from pipecat.services.llm_service import LLMService
from pipecat.services.settings import LLMSettings
# 承载回复文本的事件种类。detail=False 时 FastGPT 走 OpenAI 兼容流,文本以裸
# data: 块下发(无 event 名 → kind="data");detail=True / 旧版则用 answer/fastAnswer。
_ANSWER_KINDS = {"data", "answer", "fastAnswer"}
# SDK 会自动在 base_url 后拼 /api/v1/chat/completions(并去掉末尾 /api)。
# 用户常把「完整接口地址」填进 api_url,这里剥掉这些后缀,归一成主机根地址,
# 避免路径重复导致 404。
_ENDPOINT_SUFFIXES = (
"/api/v1/chat/completions",
"/v1/chat/completions",
"/chat/completions",
)
def normalize_base_url(url: str) -> str:
base = (url or "").strip().rstrip("/")
for suffix in _ENDPOINT_SUFFIXES:
if base.endswith(suffix):
base = base[: -len(suffix)]
break
return base or "http://localhost:3000"
def _last_user_text(messages: list[dict]) -> str:
"""取最近一条 user 消息的纯文本(兼容多模态分片)。"""
for message in reversed(messages or []):
if message.get("role") != "user":
continue
content = message.get("content")
if isinstance(content, str):
return content
if isinstance(content, list):
return "".join(
str(part.get("text") or "")
for part in content
if isinstance(part, dict)
)
return ""
def _event_text(data: Any) -> str:
"""从一个流事件里取增量文本。
兼容两种形态(对齐 SDK examples 的解析):
- 直接 text 字段(answer/fastAnswer 详情流);
- OpenAI 兼容块 choices[0].delta.content / message.content(detail=False)。
"""
if not isinstance(data, dict):
return ""
text = data.get("text")
if isinstance(text, str) and text:
return text
choices = data.get("choices")
if not isinstance(choices, list) or not choices:
return ""
first = choices[0] if isinstance(choices[0], dict) else {}
delta = first.get("delta")
if isinstance(delta, dict):
content = delta.get("content")
if isinstance(content, str) and content:
return content
message = first.get("message")
if isinstance(message, dict):
content = message.get("content")
if isinstance(content, str) and content:
return content
return ""
class FastGPTLLMService(LLMService):
"""包 FastGPT OpenAPI 的伪 LLM 服务。"""
def __init__(self, cfg: AssistantConfig, chat_id: str):
# FastGPT 自管 model/温度等参数,这里把所有 LLM 设置初始化为 None,
# 满足基类 validate_complete(否则启动期会报 NOT_GIVEN)。
super().__init__(
settings=LLMSettings(
model=None,
system_instruction=None,
temperature=None,
max_tokens=None,
top_p=None,
top_k=None,
frequency_penalty=None,
presence_penalty=None,
seed=None,
filter_incomplete_user_turns=None,
user_turn_completion_config=None,
)
)
self._chat_id = chat_id
self._base_url = normalize_base_url(cfg.fastgpt_api_url)
self._client = AsyncChatClient(
api_key=cfg.fastgpt_api_key,
base_url=self._base_url,
)
async def process_frame(self, frame: Frame, direction: FrameDirection):
await super().process_frame(frame, direction)
if not isinstance(frame, LLMContextFrame):
await self.push_frame(frame, direction)
return
user_text = _last_user_text(frame.context.get_messages())
if not user_text:
return
await self.push_frame(LLMFullResponseStartFrame())
try:
response = await self._client.create_chat_completion(
messages=[{"role": "user", "content": user_text}],
stream=True,
chatId=self._chat_id,
detail=False,
)
async for event in aiter_stream_events(response):
if event.kind in _ANSWER_KINDS:
text = _event_text(event.data)
if text:
await self.push_frame(LLMTextFrame(text))
elif event.kind == "error":
logger.error(f"FastGPT 流式错误: {event.data}")
except Exception as exc: # noqa: BLE001 - 单轮失败不应中断通话
logger.error(
f"FastGPT 调用失败: {exc} "
f"(base_url={self._base_url},拼接后应为 {self._base_url}/api/v1/chat/completions)"
)
finally:
await self.push_frame(LLMFullResponseEndFrame())