提示词添加车辆预先提取和手机号多次拼接输入

add nostream chat example
Add stream text output
2026-02-03 17:33:45 +08:00 · 2026-02-02 18:16:51 +08:00 · 2026-02-02 17:54:55 +08:00
10 changed files with 5011 additions and 10 deletions
--- a/docs/chat-stream-mode.md
+++ b/docs/chat-stream-mode.md
@@ -0,0 +1,56 @@
+# /chat 流式响应模式说明
+
+## 接口地址
+
+```
+POST http://localhost:8000/chat?stream=true
+```
+
+## 请求参数
+
+| 参数 | 类型 | 必填 | 说明 |
+|------|------|------|------|
+| sessionId | string | 是 | 会话 ID |
+| timeStamp | string | 是 | 时间戳 |
+| text | string | 是 | 用户输入文本 |
+| stream | bool | 否 | 设为 true 启用流式响应 |
+
+## SSE 事件类型
+
+| 事件类型 | 说明 | 数据格式 |
+|----------|------|----------|
+| `stage_code` | 阶段状态码 | `{"nextStageCode": "0000", "nextStage": "结束通话"}` |
+| `text_delta` | 流式文本片段 | `{"text": "您好..."}` |
+| `done` | 流式结束 | `{"status": "completed"}` |
+| `error` | 错误信息 | `{"msg": "错误描述", "code": "500"}` |
+
+## 状态码映射
+
+| 状态码 | 含义 |
+|--------|------|
+| 0000 | 结束通话 |
+| 0001 | 转接人工 |
+| 0002 | 语义无法识别转接人工 |
+| 0003 | 有人伤转接人工 |
+| 1001 | 未准备好通话 |
+| 1002 | 通话中 |
+| 2000 | 进入单车拍照 |
+| ... | ... |
+
+## 示例
+
+### 请求
+
+```bash
+python examples/stream_chat.py session-001 "发生了交通事故"
+```
+
+### 响应
+
+```
+Status: 200
+--------------------------------------------------
+[stage_code] {"nextStageCode": "1002", "nextStage": "通话中"}
+[text_delta] {"text": "您好，请问发生了什么情况？"}
+[done] {"status": "completed"}
+```
--- a/examples/nostream_chat.py
+++ b/examples/nostream_chat.py
@@ -0,0 +1,55 @@
+#!/usr/bin/env python3
+"""
+Simple CLI script to interact with /chat endpoint in non-stream mode.
+"""
+
+import asyncio
+import aiohttp
+import json
+import sys
+from datetime import datetime
+
+
+API_BASE_URL = "http://localhost:8000"
+
+
+async def chat(session_id: str, text: str):
+    """Send a non-streaming chat request."""
+    timestamp = datetime.now().isoformat()
+
+    payload = {
+        "sessionId": session_id,
+        "timeStamp": timestamp,
+        "text": text
+    }
+
+    async with aiohttp.ClientSession() as http_session:
+        async with http_session.post(
+            f"{API_BASE_URL}/chat",
+            json=payload,
+        ) as response:
+            data = await response.json()
+
+            print(f"Status: {response.status}")
+            print("-" * 50)
+            print(json.dumps(data, indent=2, ensure_ascii=False))
+
+
+async def main():
+    if len(sys.argv) < 3:
+        print("Usage: python nostream_chat.py <session_id> <message>")
+        print("Example: python nostream_chat.py test-session-123 '发生了交通事故'")
+        sys.exit(1)
+
+    session_id = sys.argv[1]
+    text = " ".join(sys.argv[2:])
+
+    print(f"Session ID: {session_id}")
+    print(f"Message: {text}")
+    print("-" * 50)
+
+    await chat(session_id, text)
+
+
+if __name__ == "__main__":
+    asyncio.run(main())
--- a/examples/stream_chat.py
+++ b/examples/stream_chat.py
@@ -0,0 +1,90 @@
+#!/usr/bin/env python3
+"""
+Stream Chat CLI - 与 /chat 端点进行流式交互的脚本。
+
+用法:
+    python stream_chat.py <session_id> <消息>
+
+示例:
+    python stream_chat.py test-001 "发生了交通事故"
+
+输出说明:
+    - [stage_code]: 阶段状态码，如 {"nextStageCode": "0000", "nextStage": "结束通话"}
+    - [text_delta]: 流式文本片段
+    - [done]: 流式结束
+    - [error]: 错误信息
+"""
+
+import asyncio
+import aiohttp
+import json
+import sys
+from datetime import datetime
+
+
+API_BASE_URL = "http://localhost:8000"
+
+
+async def stream_chat(session_id: str, text: str):
+    """Send a streaming chat request."""
+    timestamp = datetime.now().isoformat()
+
+    payload = {
+        "sessionId": session_id,
+        "timeStamp": timestamp,
+        "text": text
+    }
+
+    async with aiohttp.ClientSession() as http_session:
+        async with http_session.post(
+            f"{API_BASE_URL}/chat",
+            json=payload,
+            params={"stream": "true"},
+        ) as response:
+            print(f"Status: {response.status}")
+            print("-" * 50)
+
+            buffer = ""
+            # Use async iterator on response.content
+            async for chunk in response.content.iter_chunked(1024):
+                chunk_str = chunk.decode("utf-8")
+                buffer += chunk_str
+
+                # Process complete SSE messages
+                while "\n\n" in buffer:
+                    message, buffer = buffer.split("\n\n", 1)
+                    if message.startswith("event: "):
+                        event_type = message[7:].split("\n")[0]
+                        data_line = message.split("data: ", 1)[-1]
+                        try:
+                            data = json.loads(data_line)
+                            print(f"[{event_type}] {json.dumps(data, ensure_ascii=False)}")
+                        except json.JSONDecodeError:
+                            print(f"[{event_type}] {data_line}")
+                    elif message.startswith("data: "):
+                        data_str = message[6:]
+                        try:
+                            data = json.loads(data_str)
+                            print(f"[data] {json.dumps(data, ensure_ascii=False)}")
+                        except json.JSONDecodeError:
+                            print(f"[data] {data_str}")
+
+
+async def main():
+    if len(sys.argv) < 3:
+        print("Usage: python stream_chat.py <session_id> <message>")
+        print("Example: python stream_chat.py test-session-123 '发生了交通事故'")
+        sys.exit(1)
+
+    session_id = sys.argv[1]
+    text = " ".join(sys.argv[2:])
+
+    print(f"Session ID: {session_id}")
+    print(f"Message: {text}")
+    print("-" * 50)
+
+    await stream_chat(session_id, text)
+
+
+if __name__ == "__main__":
+    asyncio.run(main())
--- a/src/api/endpoints.py
+++ b/src/api/endpoints.py
@@ -1,4 +1,5 @@
 from fastapi import APIRouter, HTTPException, Depends
+from fastapi.responses import StreamingResponse
 from ..schemas.models import ProcessRequest_chat, ProcessResponse_chat, ProcessRequest_get, ProcessResponse_get, ProcessRequest_set, ProcessResponse_set, ProcessResponse_delete_session, ProcessRequest_delete_session
 from fastgpt_client import AsyncChatClient
 from fastgpt_client.exceptions import (
@@ -98,15 +99,104 @@ async def delete_last_two_chat_records(
 #     logging.error(f"Validation Error: {exc.errors()}")
 #     raise HTTPException(status_code=422, detail=exc.errors())

+def create_sse_event(event: str, data: dict) -> str:
+    """Format data as an SSE event."""
+    return f"event: {event}\ndata: {json.dumps(data, ensure_ascii=False)}\n\n"
+
@router.post("/chat", response_model=ProcessResponse_chat)
 async def chat(
    request: ProcessRequest_chat,
+    stream: bool = False,
    client: AsyncChatClient = Depends(get_fastgpt_client)
 ):
    """Handle chat completion request."""
    json_data = request.model_dump()
-    logger.info(f"用户请求信息ProcessRequest_chat: {json_data}")
+    logger.info(f"用户请求信息ProcessRequest_chat: {json_data}, stream={stream}")
    
+    if stream:
+        async def event_generator():
+            try:
+                # Use SDK's create_chat_completion with stream=True
+                response = await client.create_chat_completion(
+                    messages=[{"role": "user", "content": json_data['text']}],
+                    chatId=json_data['sessionId'],
+                    stream=True,
+                    detail=True
+                )
+                
+                buffer = ""
+                state_code_found = False
+                
+                async for chunk in response.aiter_lines():
+                    if chunk.startswith('data: '):
+                        data_str = chunk[6:].strip()
+                        if data_str == '[DONE]':
+                            break
+                        try:
+                            data = json.loads(data_str)
+                            try:
+                                delta_content = data['choices'][0]['delta'].get('content', '')
+                            except (KeyError, IndexError):
+                                delta_content = ''
+                            if delta_content:
+                                buffer += delta_content
+                                
+                                if not state_code_found:
+                                    # Check for <state>XXXX</state> pattern
+                                    match = re.search(r"<state>(.*?)</state>", buffer)
+                                    if match:
+                                        state_code = match.group(1)
+                                        
+                                        # Apply logic to map/adjust state code
+                                        nextStageCode = state_code
+                                        if nextStageCode in ['3001', '3002', '1002']:
+                                            nextStageCode = '1002'
+                                        elif nextStageCode == '2006':
+                                            nextStageCode = '2004'
+                                        elif nextStageCode == '2017':
+                                            nextStageCode = '2016'
+                                        elif nextStageCode == '2020':
+                                            nextStageCode = '0002'
+                                        nextStage = STATUS_CODE_MAP.get(nextStageCode, '')
+                                        
+                                        # Send stage code event
+                                        yield create_sse_event("stage_code", {
+                                            "nextStageCode": nextStageCode,
+                                            "nextStage": nextStage
+                                        })
+                                        
+                                        state_code_found = True
+                                        
+                                        # Send remaining content as text_delta
+                                        remaining_content = buffer[match.end():]
+                                        if remaining_content:
+                                            yield create_sse_event("text_delta", {"text": remaining_content})
+                                        buffer = "" # Clear buffer after extracting state
+                                else:
+                                    # State code already found, just stream text
+                                    yield create_sse_event("text_delta", {"text": delta_content})
+                                    buffer = "" # Do not buffer text after state found
+                                    
+                        except json.JSONDecodeError:
+                            continue
+                        except Exception as e:
+                            print(data)
+                            logger.error(f"Error processing chunk: {e}")
+                            continue
+
+                # If stream ends and no state code found (unlikely if format is strict), 
+                # we might want to send what we have
+                if not state_code_found and buffer:
+                     yield create_sse_event("text_delta", {"text": buffer})
+
+                yield create_sse_event("done", {"status": "completed"})
+                
+            except Exception as e:
+                logger.error(f"Streaming error: {e}")
+                yield create_sse_event("error", {"msg": str(e), "code": "500"})
+
+        return StreamingResponse(event_generator(), media_type="text/event-stream")
+
    try:
        # Use SDK's create_chat_completion
        response = await client.create_chat_completion(
--- a/test/api/fastapi.http
+++ b/test/api/fastapi.http
@@ -38,37 +38,37 @@ HTTP/1.1 200  - OK
 connection: close
 content-length: 97
 content-type: application/json
-date: Thu, 08 Jan 2026 09:26:31 GMT
+date: Thu, 08 Jan 2026 09:27:05 GMT
 server: uvicorn
 ###
 POST http://127.0.0.1:8080/set_info
 content-type: application/json

 {
-    "sessionId": "a0009",
+    "sessionId": "a1002",
    "timeStamp": "202503310303",
    "key": "hphm1",
-    "value": "沪A8938"
+    "value": "沪A8939"
 }

 HTTP/1.1 200  - OK
 connection: close
 content-length: 70
 content-type: application/json
-date: Thu, 08 Jan 2026 09:25:49 GMT
+date: Thu, 08 Jan 2026 09:27:00 GMT
 server: uvicorn
 ###
-DELETE http://127.0.0.1:8000/delete_session
+DELETE http://127.0.0.1:8080/delete_session
 content-type: application/json

 {
-    "sessionId": "a0009",
+    "sessionId": "a1002",
    "timeStamp": "202503310303"
 }

 HTTP/1.1 200  - OK
-date: Fri, 20 Jun 2025 05:56:25 GMT
-server: uvicorn
+connection: close
 content-length: 70
 content-type: application/json
-connection: close
+date: Thu, 08 Jan 2026 09:27:24 GMT
+server: uvicorn
--- a/workflow/20250419/事故信息采集20250419.json
+++ b/workflow/20250419/事故信息采集20250419.json
--- a/workflow/20250419/单车拍照流程插件.json
+++ b/workflow/20250419/单车拍照流程插件.json
--- a/workflow/20250419/单车插件.json
+++ b/workflow/20250419/单车插件.json
--- a/workflow/20250419/双车拍照流程插件.json
+++ b/workflow/20250419/双车拍照流程插件.json
--- a/workflow/20251108/事故信息采集20251108.json
+++ b/workflow/20251108/事故信息采集20251108.json
Author	SHA1	Message	Date
Xin Wang	87e616ab55	提示词添加车辆预先提取和手机号多次拼接输入	2026-02-03 17:33:45 +08:00
Xin Wang	34848dd6a0	add nostream chat example	2026-02-02 18:16:51 +08:00
Xin Wang	30306addee	Add stream text output	2026-02-02 17:54:55 +08:00