Merge pull request #1208 from shane-lil/openai-client-config
feat(openai): add client configuration support to OpenAI integration
This commit is contained in:
@@ -44,6 +44,43 @@ class InvalidResponseError(Exception):
|
|||||||
pass
|
pass
|
||||||
|
|
||||||
|
|
||||||
|
def create_openai_async_client(
    api_key: str | None = None,
    base_url: str | None = None,
    client_configs: dict[str, Any] | None = None,
) -> AsyncOpenAI:
    """Create an AsyncOpenAI client with the given configuration.

    Args:
        api_key: OpenAI API key. If None, uses the OPENAI_API_KEY environment variable.
        base_url: Base URL for the OpenAI API. If None, uses the default OpenAI API URL.
        client_configs: Additional configuration options for the AsyncOpenAI client.
            These will override any default configurations but will be overridden by
            explicit parameters (api_key, base_url).

    Returns:
        An AsyncOpenAI client instance.

    Raises:
        KeyError: If no api_key is given and OPENAI_API_KEY is not set in the
            environment.
    """
    if not api_key:
        # Fall back to the environment; a missing variable raises KeyError,
        # which fails fast rather than constructing an unusable client.
        api_key = os.environ["OPENAI_API_KEY"]

    default_headers = {
        "User-Agent": f"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_8) LightRAG/{__api_version__}",
        "Content-Type": "application/json",
    }

    if client_configs is None:
        client_configs = {}

    # Create a merged config dict with precedence: explicit params > client_configs > defaults
    merged_configs = {
        **client_configs,
        "default_headers": default_headers,
        "api_key": api_key,
    }

    # Only forward base_url when explicitly provided so the SDK default applies
    # otherwise (and so a base_url inside client_configs is not clobbered by None).
    if base_url is not None:
        merged_configs["base_url"] = base_url

    return AsyncOpenAI(**merged_configs)
|
||||||
|
|
||||||
|
|
||||||
@retry(
|
@retry(
|
||||||
stop=stop_after_attempt(3),
|
stop=stop_after_attempt(3),
|
||||||
wait=wait_exponential(multiplier=1, min=4, max=10),
|
wait=wait_exponential(multiplier=1, min=4, max=10),
|
||||||
@@ -61,29 +98,54 @@ async def openai_complete_if_cache(
|
|||||||
token_tracker: Any | None = None,
|
token_tracker: Any | None = None,
|
||||||
**kwargs: Any,
|
**kwargs: Any,
|
||||||
) -> str:
|
) -> str:
|
||||||
|
"""Complete a prompt using OpenAI's API with caching support.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
model: The OpenAI model to use.
|
||||||
|
prompt: The prompt to complete.
|
||||||
|
system_prompt: Optional system prompt to include.
|
||||||
|
history_messages: Optional list of previous messages in the conversation.
|
||||||
|
base_url: Optional base URL for the OpenAI API.
|
||||||
|
api_key: Optional OpenAI API key. If None, uses the OPENAI_API_KEY environment variable.
|
||||||
|
**kwargs: Additional keyword arguments to pass to the OpenAI API.
|
||||||
|
Special kwargs:
|
||||||
|
- openai_client_configs: Dict of configuration options for the AsyncOpenAI client.
|
||||||
|
These will be passed to the client constructor but will be overridden by
|
||||||
|
explicit parameters (api_key, base_url).
|
||||||
|
- hashing_kv: Will be removed from kwargs before passing to OpenAI.
|
||||||
|
- keyword_extraction: Will be removed from kwargs before passing to OpenAI.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
The completed text or an async iterator of text chunks if streaming.
|
||||||
|
|
||||||
|
Raises:
|
||||||
|
InvalidResponseError: If the response from OpenAI is invalid or empty.
|
||||||
|
APIConnectionError: If there is a connection error with the OpenAI API.
|
||||||
|
RateLimitError: If the OpenAI API rate limit is exceeded.
|
||||||
|
APITimeoutError: If the OpenAI API request times out.
|
||||||
|
"""
|
||||||
if history_messages is None:
|
if history_messages is None:
|
||||||
history_messages = []
|
history_messages = []
|
||||||
if not api_key:
|
|
||||||
api_key = os.environ["OPENAI_API_KEY"]
|
|
||||||
|
|
||||||
default_headers = {
|
|
||||||
"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_8) LightRAG/{__api_version__}",
|
|
||||||
"Content-Type": "application/json",
|
|
||||||
}
|
|
||||||
|
|
||||||
# Set openai logger level to INFO when VERBOSE_DEBUG is off
|
# Set openai logger level to INFO when VERBOSE_DEBUG is off
|
||||||
if not VERBOSE_DEBUG and logger.level == logging.DEBUG:
|
if not VERBOSE_DEBUG and logger.level == logging.DEBUG:
|
||||||
logging.getLogger("openai").setLevel(logging.INFO)
|
logging.getLogger("openai").setLevel(logging.INFO)
|
||||||
|
|
||||||
openai_async_client = (
|
# Extract client configuration options
|
||||||
AsyncOpenAI(default_headers=default_headers, api_key=api_key)
|
client_configs = kwargs.pop("openai_client_configs", {})
|
||||||
if base_url is None
|
|
||||||
else AsyncOpenAI(
|
# Create the OpenAI client
|
||||||
base_url=base_url, default_headers=default_headers, api_key=api_key
|
openai_async_client = create_openai_async_client(
|
||||||
)
|
api_key=api_key,
|
||||||
|
base_url=base_url,
|
||||||
|
client_configs=client_configs
|
||||||
)
|
)
|
||||||
|
|
||||||
|
# Remove special kwargs that shouldn't be passed to OpenAI
|
||||||
kwargs.pop("hashing_kv", None)
|
kwargs.pop("hashing_kv", None)
|
||||||
kwargs.pop("keyword_extraction", None)
|
kwargs.pop("keyword_extraction", None)
|
||||||
|
|
||||||
|
# Prepare messages
|
||||||
messages: list[dict[str, Any]] = []
|
messages: list[dict[str, Any]] = []
|
||||||
if system_prompt:
|
if system_prompt:
|
||||||
messages.append({"role": "system", "content": system_prompt})
|
messages.append({"role": "system", "content": system_prompt})
|
||||||
@@ -272,21 +334,34 @@ async def openai_embed(
|
|||||||
model: str = "text-embedding-3-small",
|
model: str = "text-embedding-3-small",
|
||||||
base_url: str = None,
|
base_url: str = None,
|
||||||
api_key: str = None,
|
api_key: str = None,
|
||||||
|
client_configs: dict[str, Any] = None,
|
||||||
) -> np.ndarray:
|
) -> np.ndarray:
|
||||||
if not api_key:
|
"""Generate embeddings for a list of texts using OpenAI's API.
|
||||||
api_key = os.environ["OPENAI_API_KEY"]
|
|
||||||
|
|
||||||
default_headers = {
|
Args:
|
||||||
"User-Agent": f"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_8) LightRAG/{__api_version__}",
|
texts: List of texts to embed.
|
||||||
"Content-Type": "application/json",
|
model: The OpenAI embedding model to use.
|
||||||
}
|
base_url: Optional base URL for the OpenAI API.
|
||||||
openai_async_client = (
|
api_key: Optional OpenAI API key. If None, uses the OPENAI_API_KEY environment variable.
|
||||||
AsyncOpenAI(default_headers=default_headers, api_key=api_key)
|
client_configs: Additional configuration options for the AsyncOpenAI client.
|
||||||
if base_url is None
|
These will override any default configurations but will be overridden by
|
||||||
else AsyncOpenAI(
|
explicit parameters (api_key, base_url).
|
||||||
base_url=base_url, default_headers=default_headers, api_key=api_key
|
|
||||||
)
|
Returns:
|
||||||
|
A numpy array of embeddings, one per input text.
|
||||||
|
|
||||||
|
Raises:
|
||||||
|
APIConnectionError: If there is a connection error with the OpenAI API.
|
||||||
|
RateLimitError: If the OpenAI API rate limit is exceeded.
|
||||||
|
APITimeoutError: If the OpenAI API request times out.
|
||||||
|
"""
|
||||||
|
# Create the OpenAI client
|
||||||
|
openai_async_client = create_openai_async_client(
|
||||||
|
api_key=api_key,
|
||||||
|
base_url=base_url,
|
||||||
|
client_configs=client_configs
|
||||||
)
|
)
|
||||||
|
|
||||||
response = await openai_async_client.embeddings.create(
|
response = await openai_async_client.embeddings.create(
|
||||||
model=model, input=texts, encoding_format="float"
|
model=model, input=texts, encoding_format="float"
|
||||||
)
|
)
|
||||||
|
Reference in New Issue
Block a user