Complete the code for the Ollama-compatible interface

This commit is contained in:
yangdx
2025-01-15 14:31:49 +08:00
parent b97d1ecd72
commit be134878fe
2 changed files with 129 additions and 7 deletions

@@ -2,14 +2,11 @@ from fastapi import FastAPI, HTTPException, File, UploadFile, Form
from pydantic import BaseModel
import logging
import argparse
from typing import List, Dict, Any, Optional
from lightrag import LightRAG, QueryParam
# from lightrag.llm import lollms_model_complete, lollms_embed
# from lightrag.llm import ollama_model_complete, ollama_embed, openai_embedding
from lightrag.llm import openai_complete_if_cache, ollama_embedding
# from lightrag.llm import azure_openai_complete_if_cache, azure_openai_embedding
from lightrag.utils import EmbeddingFunc
from typing import Optional, List
from enum import Enum
from pathlib import Path
import shutil
@@ -26,6 +23,13 @@ from starlette.status import HTTP_403_FORBIDDEN
from dotenv import load_dotenv
load_dotenv()
# Constants for model information
LIGHTRAG_NAME = "lightrag"
LIGHTRAG_TAG = "latest"
LIGHTRAG_MODEL = f"{LIGHTRAG_NAME}:{LIGHTRAG_TAG}"
LIGHTRAG_CREATED_AT = "2024-01-15T00:00:00Z"
LIGHTRAG_DIGEST = "sha256:lightrag"
async def llm_model_func(
prompt, system_prompt=None, history_messages=[], keyword_extraction=False, **kwargs
) -> str:
@@ -219,21 +223,43 @@ class DocumentManager:
class SearchMode(str, Enum):
naive = "naive"
local = "local"
global_ = "global"
global_ = "global"  # global_ is used because "global" is a Python reserved keyword; the enum value is still the string "global"
hybrid = "hybrid"
# Ollama API compatible models
class OllamaMessage(BaseModel):
role: str
content: str
class OllamaChatRequest(BaseModel):
model: str = LIGHTRAG_MODEL
messages: List[OllamaMessage]
stream: bool = False
options: Optional[Dict[str, Any]] = None
class OllamaChatResponse(BaseModel):
model: str
created_at: str
message: OllamaMessage
done: bool
class OllamaVersionResponse(BaseModel):
version: str
build: str = "default"
class OllamaTagResponse(BaseModel):
models: List[Dict[str, Any]]
# Original LightRAG models
class QueryRequest(BaseModel):
query: str
mode: SearchMode = SearchMode.hybrid
stream: bool = False
only_need_context: bool = False
class QueryResponse(BaseModel):
response: str
class InsertTextRequest(BaseModel):
text: str
description: Optional[str] = None
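The Ollama-compatible Pydantic models above describe the wire format the new endpoints speak. A minimal sketch of the JSON a client would send and the reply it would get back, derived from the models in this hunk (the question text and the answer placeholder are illustrative assumptions):

# Request body accepted by OllamaChatRequest ("model" defaults to "lightrag:latest")
request_payload = {
    "model": "lightrag:latest",
    "messages": [{"role": "user", "content": "/hybrid What is LightRAG?"}],  # illustrative question
    "stream": False,
}

# Response body produced by OllamaChatResponse for a non-streaming call
response_payload = {
    "model": "lightrag:latest",
    "created_at": "2024-01-15T00:00:00Z",
    "message": {"role": "assistant", "content": "..."},
    "done": True,
}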
@@ -555,6 +581,101 @@ def create_app(args):
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))
# Ollama compatible API endpoints
@app.get("/api/version")
async def get_version():
"""Get Ollama version information"""
return OllamaVersionResponse(
version="0.1.0"
)
@app.get("/api/tags")
async def get_tags():
"""Get available models"""
return OllamaTagResponse(
models=[{
"name": LIGHTRAG_NAME,
"tag": LIGHTRAG_TAG,
"size": 0,
"digest": LIGHTRAG_DIGEST,
"modified_at": LIGHTRAG_CREATED_AT
}]
)
def parse_query_mode(query: str) -> tuple[str, SearchMode]:
"""Parse query prefix to determine search mode
Returns tuple of (cleaned_query, search_mode)
"""
mode_map = {
"/local ": SearchMode.local,
"/global ": SearchMode.global_, # global_ is used because 'global' is a Python keyword
"/naive ": SearchMode.naive,
"/hybrid ": SearchMode.hybrid
}
for prefix, mode in mode_map.items():
if query.startswith(prefix):
return query[len(prefix):], mode
return query, SearchMode.hybrid
@app.post("/api/chat")
async def chat(request: OllamaChatRequest):
"""Handle chat completion requests"""
try:
# Convert chat format to query
query = request.messages[-1].content if request.messages else ""
# Parse query mode and clean query
cleaned_query, mode = parse_query_mode(query)
# Call RAG with determined mode
response = await rag.aquery(
cleaned_query,
param=QueryParam(
mode=mode,
stream=request.stream
)
)
if request.stream:
async def stream_generator():
result = ""
async for chunk in response:
result += chunk
yield OllamaChatResponse(
model=LIGHTRAG_MODEL,
created_at=LIGHTRAG_CREATED_AT,
message=OllamaMessage(
role="assistant",
content=chunk
),
done=False
)
# Send final message
yield OllamaChatResponse(
model=LIGHTRAG_MODEL,
created_at=LIGHTRAG_CREATED_AT,
message=OllamaMessage(
role="assistant",
content=result
),
done=True
)
return stream_generator()
else:
return OllamaChatResponse(
model=LIGHTRAG_MODEL,
created_at=LIGHTRAG_CREATED_AT,
message=OllamaMessage(
role="assistant",
content=response
),
done=True
)
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))
@app.get("/health", dependencies=[Depends(optional_api_key)])
async def get_status():
"""Get current system status"""

@@ -101,6 +101,7 @@ setuptools.setup(
entry_points={
"console_scripts": [
"lightrag-server=lightrag.api.lightrag_server:main [api]",
"lightrag-ollama=lightrag.api.lightrag_ollama:main [api]",
],
},
)
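The new lightrag-ollama console script resolves to a main() in lightrag.api.lightrag_ollama, mirroring the existing lightrag-server entry. A minimal sketch of what such an entry point could look like around the create_app(args) factory shown in the first file; the argument names, defaults, and the use of uvicorn are assumptions, not part of this commit:

import argparse
import uvicorn


def main():
    # Hypothetical CLI surface; the real script may expose different options.
    parser = argparse.ArgumentParser(description="LightRAG server with an Ollama-compatible API")
    parser.add_argument("--host", default="0.0.0.0", help="interface to bind")
    parser.add_argument("--port", type=int, default=9621, help="port to listen on")
    args = parser.parse_args()

    app = create_app(args)  # factory defined in lightrag_ollama (see diff above)
    uvicorn.run(app, host=args.host, port=args.port)


if __name__ == "__main__":
    main()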