feat: improve error handling for streaming responses
• Add CancelledError handling for streams
• Send error details to client in JSON
• Add error status codes and messages
• Always send final completion marker
• Refactor stream generator error handling
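In outline, the commit wraps the NDJSON stream generator so that cancellation and unexpected failures are reported to the client as JSON lines before they propagate. A minimal, self-contained sketch of that pattern (the names `guarded_stream`, `chunks`, and `demo` are illustrative, not taken from the diff):

import asyncio
import json


async def guarded_stream(chunks):
    # Sketch of the commit's pattern: stream NDJSON lines, report
    # cancellation and failures to the client as JSON, and re-raise
    # so the server still sees the exception.
    try:
        try:
            async for chunk in chunks:
                yield json.dumps({"response": chunk, "done": False}) + "\n"
        except asyncio.CancelledError:
            yield json.dumps({
                "error": {"code": "STREAM_CANCELLED",
                          "message": "Stream was cancelled by server"},
                "done": False,
            }) + "\n"
            raise  # propagate so the surrounding task is torn down
        yield json.dumps({"done": True}) + "\n"
    except Exception as exc:
        # Ordinary failures: report, still send the final marker, re-raise.
        yield json.dumps({
            "error": {"code": "STREAM_ERROR", "message": str(exc)},
            "done": False,
        }) + "\n"
        yield json.dumps({"done": True}) + "\n"
        raise


async def demo():
    async def chunks():
        for piece in ("Hello", ", ", "world"):
            yield piece

    async for line in guarded_stream(chunks()):
        print(line, end="")


asyncio.run(demo())

Note that on Python 3.8+ asyncio.CancelledError derives from BaseException, so the outer except Exception does not swallow the re-raised cancellation; as in the diff below, the final completion marker is only guaranteed for ordinary errors.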
@@ -12,7 +12,7 @@ from fastapi import (
 # Add this to store progress globally
 from typing import Dict
 import threading
+import asyncio
 import json
 import os
 
@@ -1718,11 +1718,11 @@ def create_app(args):
         )
 
         async def stream_generator():
-            try:
             first_chunk_time = None
             last_chunk_time = None
             total_response = ""
 
+            try:
                 # Ensure response is an async generator
                 if isinstance(response, str):
                     # If it's a string, send in two parts
@@ -1760,6 +1760,7 @@ def create_app(args):
                     }
                     yield f"{json.dumps(data, ensure_ascii=False)}\n"
                 else:
+                    try:
                         async for chunk in response:
                             if chunk:
                                 if first_chunk_time is None:
@@ -1779,7 +1780,20 @@ def create_app(args):
                                     "done": False,
                                 }
                                 yield f"{json.dumps(data, ensure_ascii=False)}\n"
+                    except asyncio.CancelledError:
+                        error_data = {
+                            "model": ollama_server_infos.LIGHTRAG_MODEL,
+                            "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
+                            "error": {
+                                "code": "STREAM_CANCELLED",
+                                "message": "Stream was cancelled by server"
+                            },
+                            "done": False
+                        }
+                        yield f"{json.dumps(error_data, ensure_ascii=False)}\n"
+                        raise
 
+                if last_chunk_time is not None:
                     completion_tokens = estimate_tokens(total_response)
                     total_time = last_chunk_time - start_time
                     prompt_eval_time = first_chunk_time - start_time
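The detail worth noting in the hunk above is the ordering: the generator yields the STREAM_CANCELLED line first, then re-raises, so the client gets one last JSON object explaining the drop while the event loop still sees the task as cancelled. A small hypothetical demo of that ordering (not from the repository), as a consumer observes it when its task is cancelled mid-stream:

import asyncio
import json


async def stream():
    try:
        while True:
            await asyncio.sleep(0.1)
            yield json.dumps({"response": "chunk", "done": False}) + "\n"
    except asyncio.CancelledError:
        # Cancellation arrives at the await inside the generator frame.
        yield json.dumps({"error": {"code": "STREAM_CANCELLED"},
                          "done": False}) + "\n"
        raise


async def consume():
    async for line in stream():
        print(line, end="")


async def main():
    task = asyncio.create_task(consume())
    await asyncio.sleep(0.35)
    task.cancel()
    try:
        await task
    except asyncio.CancelledError:
        print("consumer task finished as cancelled")


asyncio.run(main())

The consumer prints a few normal chunks, then the error line, and only then does the CancelledError propagate out of the async for.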
@@ -1797,9 +1811,30 @@ def create_app(args):
                         "eval_duration": eval_time,
                     }
                     yield f"{json.dumps(data, ensure_ascii=False)}\n"
-                    return # Ensure the generator ends immediately after sending the completion marker
             except Exception as e:
-                logging.error(f"Error in stream_generator: {str(e)}")
+                error_msg = f"Error in stream_generator: {str(e)}"
+                logging.error(error_msg)
+
+                # Send the error message to the client
+                error_data = {
+                    "model": ollama_server_infos.LIGHTRAG_MODEL,
+                    "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
+                    "error": {
+                        "code": "STREAM_ERROR",
+                        "message": error_msg
+                    },
+                    "done": False
+                }
+                yield f"{json.dumps(error_data, ensure_ascii=False)}\n"
+
+                # Make sure the final completion marker is sent
+                final_data = {
+                    "model": ollama_server_infos.LIGHTRAG_MODEL,
+                    "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
+                    "done": True
+                }
+                yield f"{json.dumps(final_data, ensure_ascii=False)}\n"
                 raise
 
         return StreamingResponse(
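From the client's perspective the response body is newline-delimited JSON, so the new error object and the final done marker can be handled line by line. A hedged sketch using httpx; the URL, port, and payload are placeholders for whatever Ollama-style endpoint the server actually exposes, not values taken from this diff:

import asyncio
import json

import httpx


async def read_stream():
    # Placeholder endpoint and payload; adjust to the server's real route.
    url = "http://localhost:9621/api/chat"
    payload = {"model": "lightrag",
               "messages": [{"role": "user", "content": "hi"}]}

    async with httpx.AsyncClient(timeout=None) as client:
        async with client.stream("POST", url, json=payload) as resp:
            async for line in resp.aiter_lines():
                if not line:
                    continue
                data = json.loads(line)
                if "error" in data:
                    # Surfaced by the error handling added in this commit.
                    print("stream error:", data["error"]["code"],
                          data["error"].get("message", ""))
                if data.get("done"):
                    break


asyncio.run(read_stream())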