Implement Gunicorn+Uvicorn integration for shared data preloading

- Create run_with_gunicorn.py script to properly initialize shared data in the
  main process before forking worker processes
- Revert uvicorn to single-process mode only, and let gunicorn handle all multi-process management
This commit is contained in:
yangdx
2025-02-27 13:25:22 +08:00
parent 7c237920b1
commit 7aec78833c
4 changed files with 365 additions and 23 deletions

80
gunicorn_config.py Normal file
View File

@@ -0,0 +1,80 @@
# gunicorn_config.py
import os
import multiprocessing
from lightrag.kg.shared_storage import finalize_share_data
from lightrag.api.utils_api import parse_args
# Parse command line arguments (shared with the LightRAG server CLI)
args = parse_args()

# Determine worker count - the WORKERS environment variable takes
# precedence over the --workers command line argument
workers = int(os.getenv("WORKERS", args.workers))

# If not specified (<= 1), fall back to CPU count * 2 + 1
# (Gunicorn's recommended configuration).
# NOTE(review): an explicitly requested workers=1 is also overridden here —
# confirm that single-worker Gunicorn runs are not intended.
if workers <= 1:
    workers = multiprocessing.cpu_count() * 2 + 1

# Binding address - HOST/PORT environment variables take precedence over CLI args
bind = f"{os.getenv('HOST', args.host)}:{os.getenv('PORT', args.port)}"

# Preload the app so shared data is initialized once in the master
# process before worker processes are forked
preload_app = True

# Use the Uvicorn worker class so the ASGI app runs under Gunicorn
worker_class = "uvicorn.workers.UvicornWorker"

# Other Gunicorn configurations
timeout = int(os.getenv("TIMEOUT", 120))
keepalive = 5

# Optional SSL configuration
if args.ssl:
    certfile = args.ssl_certfile
    keyfile = args.ssl_keyfile

# Logging configuration ('-' means stderr)
errorlog = os.getenv("ERROR_LOG", "-")
accesslog = os.getenv("ACCESS_LOG", "-")
loglevel = os.getenv("LOG_LEVEL", "info")
def on_starting(server):
    """
    Gunicorn master-process hook, executed once before the first worker
    processes are forked.

    Prints startup banners and, when psutil is available, reports the
    master process memory footprint after initialization.
    """
    separator = "=" * 80
    print(separator)
    print(f"GUNICORN MASTER PROCESS: on_starting jobs for all {workers} workers")
    print(f"Process ID: {os.getpid()}")
    print(separator)

    # Memory usage monitoring (best-effort: psutil is an optional dependency)
    try:
        import psutil

        rss = psutil.Process(os.getpid()).memory_info().rss
        print(f"Memory usage after initialization: {rss / 1024 / 1024:.2f} MB")
    except ImportError:
        print("psutil not installed, skipping memory usage reporting")

    print(separator)
    print("Gunicorn initialization complete, forking workers...")
    print(separator)
def on_exit(server):
    """
    Gunicorn master-process hook, executed when the server is shutting down.

    Releases the shared storage created during preload so that the
    multiprocessing Manager and its shared objects are cleaned up.
    """
    banner = "=" * 80
    print(banner)
    print("GUNICORN MASTER PROCESS: Shutting down")
    print(f"Process ID: {os.getpid()}")
    print(banner)

    # Release shared resources held by the master process
    finalize_share_data()

    print(banner)
    print("Gunicorn shutdown complete")
    print(banner)

View File

@@ -483,17 +483,28 @@ def main():
display_splash_screen(args) display_splash_screen(args)
from lightrag.kg.shared_storage import initialize_share_data # Check if running under Gunicorn
initialize_share_data(args.workers) if 'GUNICORN_CMD_ARGS' in os.environ:
# If started with Gunicorn, return directly as Gunicorn will call get_application
print("Running under Gunicorn - worker management handled by Gunicorn")
return
# If not running under Gunicorn, initialize shared data here
from lightrag.kg.shared_storage import initialize_share_data
print("Starting in single-process mode")
initialize_share_data(1) # Force single process mode
# Create application instance directly instead of using factory function
app = create_app(args)
# Start Uvicorn in single process mode
uvicorn_config = { uvicorn_config = {
"app": "lightrag.api.lightrag_server:get_application", "app": app, # Pass application instance directly instead of string path
"factory": True,
"host": args.host, "host": args.host,
"port": args.port, "port": args.port,
"workers": args.workers,
"log_config": None, # Disable default config "log_config": None, # Disable default config
} }
if args.ssl: if args.ssl:
uvicorn_config.update( uvicorn_config.update(
{ {
@@ -501,6 +512,8 @@ def main():
"ssl_keyfile": args.ssl_keyfile, "ssl_keyfile": args.ssl_keyfile,
} }
) )
print(f"Starting Uvicorn server in single-process mode on {args.host}:{args.port}")
uvicorn.run(**uvicorn_config) uvicorn.run(**uvicorn_config)

View File

@@ -1,10 +1,19 @@
import os import os
import sys
from multiprocessing.synchronize import Lock as ProcessLock from multiprocessing.synchronize import Lock as ProcessLock
from threading import Lock as ThreadLock from threading import Lock as ThreadLock
from multiprocessing import Manager from multiprocessing import Manager
from typing import Any, Dict, Optional, Union from typing import Any, Dict, Optional, Union
from lightrag.utils import logger from lightrag.utils import logger
# Direct logging helper for critical messages that must be visible in all
# processes (module loggers may not be configured in the Gunicorn master)
def direct_log(message, level="INFO"):
    """
    Write a log line straight to stderr and flush immediately, ensuring
    visibility in every process, including the Gunicorn master process.
    """
    sys.stderr.write(f"{level}: {message}\n")
    sys.stderr.flush()
LockType = Union[ProcessLock, ThreadLock] LockType = Union[ProcessLock, ThreadLock]
_manager = None _manager = None
@@ -21,41 +30,60 @@ _global_lock: Optional[LockType] = None
def initialize_share_data(workers: int = 1): def initialize_share_data(workers: int = 1):
"""Initialize storage data""" """
Initialize shared storage data for single or multi-process mode.
When used with Gunicorn's preload feature, this function is called once in the
master process before forking worker processes, allowing all workers to share
the same initialized data.
In single-process mode, this function is called during LightRAG object initialization.
The function determines whether to use cross-process shared variables for data storage
based on the number of workers. If workers=1, it uses thread locks and local dictionaries.
If workers>1, it uses process locks and shared dictionaries managed by multiprocessing.Manager.
Args:
workers (int): Number of worker processes. If 1, single-process mode is used.
If > 1, multi-process mode with shared memory is used.
"""
global _manager, _is_multiprocess, is_multiprocess, _global_lock, _shared_dicts, _share_objects, _init_flags, _initialized global _manager, _is_multiprocess, is_multiprocess, _global_lock, _shared_dicts, _share_objects, _init_flags, _initialized
# Check if already initialized
if _initialized and _initialized.value: if _initialized and _initialized.value:
is_multiprocess = _is_multiprocess.value is_multiprocess = _is_multiprocess.value
if _is_multiprocess.value: direct_log(f"Process {os.getpid()} storage data already initialized (multiprocess={_is_multiprocess.value})!")
logger.info(f"Process {os.getpid()} storage data already initialized!") return
return
_manager = Manager() _manager = Manager()
_initialized = _manager.Value("b", False) _initialized = _manager.Value("b", False)
_is_multiprocess = _manager.Value("b", False) _is_multiprocess = _manager.Value("b", False)
if workers == 1: # Force multi-process mode if workers > 1
_is_multiprocess.value = False if workers > 1:
_global_lock = ThreadLock()
_shared_dicts = {}
_share_objects = {}
_init_flags = {}
logger.info(f"Process {os.getpid()} storage data created for Single Process")
else:
_is_multiprocess.value = True _is_multiprocess.value = True
_global_lock = _manager.Lock() _global_lock = _manager.Lock()
# Create shared dictionaries with manager # Create shared dictionaries with manager
_shared_dicts = _manager.dict() _shared_dicts = _manager.dict()
_share_objects = _manager.dict() _share_objects = _manager.dict()
_init_flags = _manager.dict() # 使用共享字典存储初始化标志 _init_flags = _manager.dict() # Use shared dictionary to store initialization flags
logger.info(f"Process {os.getpid()} storage data created for Multiple Process") direct_log(f"Process {os.getpid()} storage data created for Multiple Process (workers={workers})")
else:
_is_multiprocess.value = False
_global_lock = ThreadLock()
_shared_dicts = {}
_share_objects = {}
_init_flags = {}
direct_log(f"Process {os.getpid()} storage data created for Single Process")
# Mark as initialized
_initialized.value = True
is_multiprocess = _is_multiprocess.value is_multiprocess = _is_multiprocess.value
def try_initialize_namespace(namespace: str) -> bool: def try_initialize_namespace(namespace: str) -> bool:
""" """
尝试初始化命名空间。返回True表示当前进程获得了初始化权限。 Try to initialize a namespace. Returns True if the current process gets initialization permission.
使用共享字典的原子操作确保只有一个进程能成功初始化。 Uses atomic operations on shared dictionaries to ensure only one process can successfully initialize.
""" """
global _init_flags, _manager global _init_flags, _manager
@@ -126,3 +154,52 @@ def get_namespace_data(namespace: str) -> Dict[str, Any]:
def get_scan_progress() -> Dict[str, Any]: def get_scan_progress() -> Dict[str, Any]:
"""get storage space for document scanning progress data""" """get storage space for document scanning progress data"""
return get_namespace_data("scan_progress") return get_namespace_data("scan_progress")
def finalize_share_data():
    """
    Release shared resources and clean up.

    This function should be called when the application is shutting down
    to properly release shared resources and avoid memory leaks.

    In multi-process mode, it shuts down the Manager and releases all shared
    objects. In single-process mode, it simply resets the global variables.
    """
    global _manager, _is_multiprocess, is_multiprocess, _global_lock, _shared_dicts, _share_objects, _init_flags, _initialized

    # Nothing to do if initialize_share_data() never ran (or already finalized)
    if not (_initialized and _initialized.value):
        direct_log(f"Process {os.getpid()} storage data not initialized, nothing to finalize")
        return

    direct_log(f"Process {os.getpid()} finalizing storage data (multiprocess={_is_multiprocess.value})")

    # In multi-process mode, shut down the Manager; clear the shared dicts
    # first so proxies are emptied before the Manager process exits
    if _is_multiprocess.value and _manager is not None:
        try:
            if _shared_dicts is not None:
                _shared_dicts.clear()
            if _share_objects is not None:
                _share_objects.clear()
            if _init_flags is not None:
                _init_flags.clear()

            # Shut down the Manager background process
            _manager.shutdown()
            direct_log(f"Process {os.getpid()} Manager shutdown complete")
        except Exception as e:
            # Best-effort cleanup: log and continue resetting globals
            direct_log(f"Process {os.getpid()} Error shutting down Manager: {e}", level="ERROR")

    # Reset global variables so a subsequent initialize_share_data() starts fresh
    _manager = None
    _initialized = None
    _is_multiprocess = None
    is_multiprocess = None
    _shared_dicts = None
    _share_objects = None
    _init_flags = None
    _global_lock = None

    direct_log(f"Process {os.getpid()} storage data finalization complete")

172
run_with_gunicorn.py Executable file
View File

@@ -0,0 +1,172 @@
#!/usr/bin/env python
"""
Start LightRAG server with Gunicorn
"""
import os
import sys
import json
import signal
import argparse
import subprocess
from lightrag.api.utils_api import parse_args, display_splash_screen
from lightrag.kg.shared_storage import initialize_share_data, finalize_share_data
# Signal handler for graceful shutdown (SIGINT / SIGTERM)
def signal_handler(sig, frame):
    """Release shared resources and exit cleanly when a termination signal arrives."""
    print("\n\n" + "=" * 80)
    print("RECEIVED TERMINATION SIGNAL")
    print(f"Process ID: {os.getpid()}")
    print("=" * 80 + "\n")

    # Release shared resources (Manager, shared dicts) before exiting
    finalize_share_data()

    # Exit with success status
    sys.exit(0)
def main():
    """
    Entry point: parse Gunicorn-specific and LightRAG CLI arguments,
    initialize shared data in this (master) process, then start Gunicorn
    through its Python API so workers are forked after preload.
    """
    # Register signal handlers for graceful shutdown
    signal.signal(signal.SIGINT, signal_handler)  # Ctrl+C
    signal.signal(signal.SIGTERM, signal_handler)  # kill command

    # Parser for Gunicorn-specific parameters; everything else is
    # forwarded untouched to LightRAG's own parse_args()
    parser = argparse.ArgumentParser(description="Start LightRAG server with Gunicorn")
    parser.add_argument(
        "--workers",
        type=int,
        help="Number of worker processes (overrides the default or config.ini setting)",
    )
    parser.add_argument(
        "--timeout",
        type=int,
        help="Worker timeout in seconds (default: 120)",
    )
    parser.add_argument(
        "--log-level",
        choices=["debug", "info", "warning", "error", "critical"],
        help="Gunicorn log level",
    )

    # Parse Gunicorn-specific arguments, keeping the rest for LightRAG
    gunicorn_args, remaining_args = parser.parse_known_args()

    # Pass remaining arguments to LightRAG's parse_args
    sys.argv = [sys.argv[0]] + remaining_args
    args = parse_args()

    # Export Gunicorn overrides as environment variables so that
    # gunicorn_config.py (executed later) can pick them up
    if gunicorn_args.workers:
        args.workers = gunicorn_args.workers
        os.environ["WORKERS"] = str(gunicorn_args.workers)
    if gunicorn_args.timeout:
        os.environ["TIMEOUT"] = str(gunicorn_args.timeout)
    if gunicorn_args.log_level:
        os.environ["LOG_LEVEL"] = gunicorn_args.log_level

    # Save all LightRAG args to an environment variable for worker processes.
    # This is the key step for passing arguments to lightrag_server.py
    os.environ["LIGHTRAG_ARGS"] = json.dumps(vars(args))

    # Display startup information
    display_splash_screen(args)

    print("🚀 Starting LightRAG with Gunicorn")
    print(f"🔄 Worker management: Gunicorn (workers={args.workers})")
    print("🔍 Preloading app: Enabled")
    print("📝 Note: Using Gunicorn's preload feature for shared data initialization")

    print("\n\n" + "=" * 80)
    print("MAIN PROCESS INITIALIZATION")
    print(f"Process ID: {os.getpid()}")
    print(f"Workers setting: {args.workers}")
    print("=" * 80 + "\n")

    # Ensure WORKERS is set before gunicorn_config.py is executed
    if args.workers > 1:
        os.environ["WORKERS"] = str(args.workers)

    # Import Gunicorn's base application class
    from gunicorn.app.base import BaseApplication

    class GunicornApp(BaseApplication):
        """Embedded Gunicorn application that loads settings from gunicorn_config.py."""

        def __init__(self, app, options=None):
            self.options = options or {}
            self.application = app
            super().__init__()

        def load_config(self):
            # Gunicorn configuration values we forward from the config module
            valid_options = {
                "bind", "workers", "worker_class", "timeout", "keepalive",
                "preload_app", "errorlog", "accesslog", "loglevel",
                "certfile", "keyfile", "limit_request_line", "limit_request_fields",
                "limit_request_field_size", "graceful_timeout", "max_requests",
                "max_requests_jitter",
            }
            # Server hooks that must be set as callables
            special_hooks = {
                "on_starting", "on_reload", "on_exit", "pre_fork", "post_fork",
                "pre_exec", "pre_request", "post_request", "worker_init",
                "worker_exit", "nworkers_changed", "child_exit",
            }

            # Load gunicorn_config.py from the directory of this script so
            # startup does not depend on the current working directory
            # (a bare "gunicorn_config.py" path breaks when launched elsewhere)
            import importlib.util

            config_path = os.path.join(
                os.path.dirname(os.path.abspath(__file__)), "gunicorn_config.py"
            )
            spec = importlib.util.spec_from_file_location("gunicorn_config", config_path)
            self.config_module = importlib.util.module_from_spec(spec)
            spec.loader.exec_module(self.config_module)

            # Forward plain values and hook callables to Gunicorn's config
            for key in dir(self.config_module):
                if key in valid_options:
                    value = getattr(self.config_module, key)
                    # Skip callables here; only plain values are settings
                    if not callable(value):
                        self.cfg.set(key, value)
                elif key in special_hooks:
                    value = getattr(self.config_module, key)
                    if callable(value):
                        self.cfg.set(key, value)

            # Command line arguments take precedence over the config module
            if gunicorn_args.workers:
                self.cfg.set("workers", gunicorn_args.workers)
            if gunicorn_args.timeout:
                self.cfg.set("timeout", gunicorn_args.timeout)
            if gunicorn_args.log_level:
                self.cfg.set("loglevel", gunicorn_args.log_level)

        def load(self):
            # Import the ASGI application factory lazily, inside the
            # Gunicorn lifecycle, and return the application instance
            from lightrag.api.lightrag_server import get_application

            return get_application()

    # Create the application wrapper
    app = GunicornApp("")

    # Initialize shared data in THIS process, before Gunicorn forks workers,
    # so the preloaded state is inherited by every worker
    workers_count = int(args.workers)
    if workers_count > 1:
        # Flag identifying the Gunicorn master process to child code
        os.environ["LIGHTRAG_MAIN_PROCESS"] = "1"
        initialize_share_data(workers_count)
    else:
        initialize_share_data(1)

    # Run the application (blocks until Gunicorn exits)
    print("\nStarting Gunicorn with direct Python API...")
    app.run()
if __name__ == "__main__":
    main()