优化流式响应处理并添加测试用例

- 修复流式响应中的完成标记逻辑 - 添加非流式调用测试 - 添加流式调用测试 - 优化JSON序列化，支持非ASCII字符 - 确保生成器在完成标记后立即结束
2025-01-15 20:18:17 +08:00
parent f15f97a51d
commit 23f838ec94
2 changed files with 103 additions and 36 deletions
--- a/lightrag/api/lightrag_ollama.py
+++ b/lightrag/api/lightrag_ollama.py
@@ -706,18 +706,21 @@ def create_app(args):
                    try:
                        # 确保 response 是异步生成器
                        if isinstance(response, str):
                            # 如果是字符串，作为单个完整响应发送
                            data = {
-                                'model': LIGHTRAG_MODEL,
+                                "model": LIGHTRAG_MODEL,
-                                'created_at': LIGHTRAG_CREATED_AT,
+                                "created_at": LIGHTRAG_CREATED_AT,
-                                'message': {
+                                "message": {
-                                    'role': 'assistant',
+                                    "role": "assistant",
-                                    'content': response
+                                    "content": response
                                },
-                                'done': True
+                                "done": True
                            }
-                            yield f"data: {json.dumps(data)}\n\n"
+                            yield f"data: {json.dumps(data, ensure_ascii=False)}\n\n"
                        else:
                            # 流式响应
                            async for chunk in response:
                                if chunk:  # 只发送非空内容
                                    data = {
                                        "model": LIGHTRAG_MODEL,
                                        "created_at": LIGHTRAG_CREATED_AT,
@@ -727,17 +730,7 @@ def create_app(args):
                                        },
                                        "done": False
                                    }
-                                yield f"data: {json.dumps(data)}\n\n"
+                                    yield f"data: {json.dumps(data, ensure_ascii=False)}\n\n"
                            data = {
                                "model": LIGHTRAG_MODEL,
                                "created_at": LIGHTRAG_CREATED_AT,
                                "message": {
                                    "role": "assistant",
                                    "content": chunk
                                },
                                "done": False
                            }
                            yield f"data: {json.dumps(data)}\n\n"
                            # 发送完成标记
                            data = {
@@ -749,7 +742,8 @@ def create_app(args):
                                },
                                "done": True
                            }
-                        yield f"data: {json.dumps(data)}\n\n"
+                            yield f"data: {json.dumps(data, ensure_ascii=False)}\n\n"
                            return  # 确保生成器在发送完成标记后立即结束
                    except Exception as e:
                        logging.error(f"Error in stream_generator: {str(e)}")
                        raise
--- a/test_lightrag_ollama_chat.py
+++ b/test_lightrag_ollama_chat.py
@@ -0,0 +1,73 @@
 import requests
 import json
 import sseclient
 def test_non_stream_chat():
    """测试非流式调用 /api/chat 接口"""
    url = "http://localhost:9621/api/chat"
    # 构造请求数据
    data = {
        "model": "lightrag:latest",
        "messages": [
            {
                "role": "user",
                "content": "孙悟空"
            }
        ],
        "stream": False
    }
    # 发送请求
    response = requests.post(url, json=data)
    # 打印响应
    print("\n=== 非流式调用响应 ===")
    print(json.dumps(response.json(), ensure_ascii=False, indent=2))
 def test_stream_chat():
    """测试流式调用 /api/chat 接口"""
    url = "http://localhost:9621/api/chat"
    # 构造请求数据
    data = {
        "model": "lightrag:latest",
        "messages": [
            {
                "role": "user",
                "content": "/naive 孙悟空有什么法力，性格特征是什么"
            }
        ],
        "stream": True
    }
    # 发送请求并获取 SSE 流
    response = requests.post(url, json=data, stream=True)
    client = sseclient.SSEClient(response)
    print("\n=== 流式调用响应 ===")
    output_buffer = []
    try:
        for event in client.events():
            try:
                data = json.loads(event.data)
                message = data.get("message", {})
                content = message.get("content", "")
                if content:  # 只收集非空内容
                    output_buffer.append(content)
                if data.get("done", False):  # 如果收到完成标记，退出循环
                    break
            except json.JSONDecodeError:
                print("Error decoding JSON from SSE event")
    finally:
        response.close()  # 确保关闭响应连接
    # 一次性打印所有收集到的内容
    print("".join(output_buffer))
 if __name__ == "__main__":
    # 先测试非流式调用
    test_non_stream_chat()
    # 再测试流式调用
    test_stream_chat()