Update lightrag_server.py

2025-01-28 15:30:36 +01:00
parent 9fdea743e4
commit d493830b10
1 changed files with 65 additions and 62 deletions
--- a/lightrag/api/lightrag_server.py
+++ b/lightrag/api/lightrag_server.py
@@ -47,7 +47,7 @@ def estimate_tokens(text: str) -> int:

    return int(tokens)

-
+class OllamaServerInfos:
    # Constants for emulated Ollama model information
    LIGHTRAG_NAME = "lightrag"
    LIGHTRAG_TAG = os.getenv("OLLAMA_EMULATING_MODEL_TAG", "latest")
@@ -61,6 +61,9 @@ DOC_STATUS_STORAGE = "JsonDocStatusStorage"
    GRAPH_STORAGE = "NetworkXStorage"
    VECTOR_STORAGE = "NanoVectorDBStorage"

+# Add infos
+ollama_server_infos = OllamaServerInfos()
+
 # read config.ini
 config = configparser.ConfigParser()
 config.read("config.ini", "utf-8")
@@ -68,8 +71,8 @@ config.read("config.ini", "utf-8")
 redis_uri = config.get("redis", "uri", fallback=None)
 if redis_uri:
    os.environ["REDIS_URI"] = redis_uri
-    KV_STORAGE = "RedisKVStorage"
-    DOC_STATUS_STORAGE = "RedisKVStorage"
+    ollama_server_infos.KV_STORAGE = "RedisKVStorage"
+    ollama_server_infos.DOC_STATUS_STORAGE = "RedisKVStorage"

 # Neo4j config
 neo4j_uri = config.get("neo4j", "uri", fallback=None)
@@ -79,7 +82,7 @@ if neo4j_uri:
    os.environ["NEO4J_URI"] = neo4j_uri
    os.environ["NEO4J_USERNAME"] = neo4j_username
    os.environ["NEO4J_PASSWORD"] = neo4j_password
-    GRAPH_STORAGE = "Neo4JStorage"
+    ollama_server_infos.GRAPH_STORAGE = "Neo4JStorage"

 # Milvus config
 milvus_uri = config.get("milvus", "uri", fallback=None)
@@ -91,7 +94,7 @@ if milvus_uri:
    os.environ["MILVUS_USER"] = milvus_user
    os.environ["MILVUS_PASSWORD"] = milvus_password
    os.environ["MILVUS_DB_NAME"] = milvus_db_name
-    VECTOR_STORAGE = "MilvusVectorDBStorge"
+    ollama_server_infos.VECTOR_STORAGE = "MilvusVectorDBStorge"

 # MongoDB config
 mongo_uri = config.get("mongodb", "uri", fallback=None)
@@ -99,8 +102,8 @@ mongo_database = config.get("mongodb", "LightRAG", fallback=None)
 if mongo_uri:
    os.environ["MONGO_URI"] = mongo_uri
    os.environ["MONGO_DATABASE"] = mongo_database
-    KV_STORAGE = "MongoKVStorage"
-    DOC_STATUS_STORAGE = "MongoKVStorage"
+    ollama_server_infos.KV_STORAGE = "MongoKVStorage"
+    ollama_server_infos.DOC_STATUS_STORAGE = "MongoKVStorage"


 def get_default_host(binding_type: str) -> str:
@@ -213,7 +216,7 @@ def display_splash_screen(args: argparse.Namespace) -> None:
    # System Configuration
    ASCIIColors.magenta("\n🛠️ System Configuration:")
    ASCIIColors.white("    ├─ Ollama Emulating Model: ", end="")
-    ASCIIColors.yellow(f"{LIGHTRAG_MODEL}")
+    ASCIIColors.yellow(f"{ollama_server_infos.LIGHTRAG_MODEL}")
    ASCIIColors.white("    ├─ Log Level: ", end="")
    ASCIIColors.yellow(f"{args.log_level}")
    ASCIIColors.white("    ├─ Timeout: ", end="")
@@ -487,13 +490,13 @@ def parse_args() -> argparse.Namespace:
    parser.add_argument(
        "--simulated-model-name",
        type=int,
-        default=get_env_value("SIMULATED_MODEL_NAME", LIGHTRAG_MODEL, str),
+        default=get_env_value("SIMULATED_MODEL_NAME", ollama_server_infos.LIGHTRAG_MODEL, str),
        help="Number of conversation history turns to include (default: from env or 3)",
    )

    args = parser.parse_args()

-    LIGHTRAG_MODEL = args.simulated_model_name
+    ollama_server_infos.LIGHTRAG_MODEL = args.simulated_model_name

    return args

@@ -547,7 +550,7 @@ class OllamaMessage(BaseModel):


 class OllamaChatRequest(BaseModel):
-    model: str = LIGHTRAG_MODEL
+    model: str = ollama_server_infos.LIGHTRAG_MODEL
    messages: List[OllamaMessage]
    stream: bool = True  # Default to streaming mode
    options: Optional[Dict[str, Any]] = None
@@ -562,7 +565,7 @@ class OllamaChatResponse(BaseModel):


 class OllamaGenerateRequest(BaseModel):
-    model: str = LIGHTRAG_MODEL
+    model: str = ollama_server_infos.LIGHTRAG_MODEL
    prompt: str
    system: Optional[str] = None
    stream: bool = False
@@ -851,10 +854,10 @@ def create_app(args):
            if args.llm_binding == "lollms" or args.llm_binding == "ollama"
            else {},
            embedding_func=embedding_func,
-            kv_storage=KV_STORAGE,
-            graph_storage=GRAPH_STORAGE,
-            vector_storage=VECTOR_STORAGE,
-            doc_status_storage=DOC_STATUS_STORAGE,
+            kv_storage=ollama_server_infos.KV_STORAGE,
+            graph_storage=ollama_server_infos.GRAPH_STORAGE,
+            vector_storage=ollama_server_infos.VECTOR_STORAGE,
+            doc_status_storage=ollama_server_infos.DOC_STATUS_STORAGE,
        )
    else:
        rag = LightRAG(
@@ -868,10 +871,10 @@ def create_app(args):
            llm_model_max_async=args.max_async,
            llm_model_max_token_size=args.max_tokens,
            embedding_func=embedding_func,
-            kv_storage=KV_STORAGE,
-            graph_storage=GRAPH_STORAGE,
-            vector_storage=VECTOR_STORAGE,
-            doc_status_storage=DOC_STATUS_STORAGE,
+            kv_storage=ollama_server_infos.KV_STORAGE,
+            graph_storage=ollama_server_infos.GRAPH_STORAGE,
+            vector_storage=ollama_server_infos.VECTOR_STORAGE,
+            doc_status_storage=ollama_server_infos.DOC_STATUS_STORAGE,
        )

    async def index_file(file_path: Union[str, Path]) -> None:
@@ -1432,16 +1435,16 @@ def create_app(args):
        return OllamaTagResponse(
            models=[
                {
-                    "name": LIGHTRAG_MODEL,
-                    "model": LIGHTRAG_MODEL,
-                    "size": LIGHTRAG_SIZE,
-                    "digest": LIGHTRAG_DIGEST,
-                    "modified_at": LIGHTRAG_CREATED_AT,
+                    "name": ollama_server_infos.LIGHTRAG_MODEL,
+                    "model": ollama_server_infos.LIGHTRAG_MODEL,
+                    "size": ollama_server_infos.LIGHTRAG_SIZE,
+                    "digest": ollama_server_infos.LIGHTRAG_DIGEST,
+                    "modified_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                    "details": {
                        "parent_model": "",
                        "format": "gguf",
-                        "family": LIGHTRAG_NAME,
-                        "families": [LIGHTRAG_NAME],
+                        "family": ollama_server_infos.LIGHTRAG_NAME,
+                        "families": [ollama_server_infos.LIGHTRAG_NAME],
                        "parameter_size": "13B",
                        "quantization_level": "Q4_0",
                    },
@@ -1504,8 +1507,8 @@ def create_app(args):
                            total_response = response

                            data = {
-                                "model": LIGHTRAG_MODEL,
-                                "created_at": LIGHTRAG_CREATED_AT,
+                                "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                "response": response,
                                "done": False,
                            }
@@ -1517,8 +1520,8 @@ def create_app(args):
                            eval_time = last_chunk_time - first_chunk_time

                            data = {
-                                "model": LIGHTRAG_MODEL,
-                                "created_at": LIGHTRAG_CREATED_AT,
+                                "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                "done": True,
                                "total_duration": total_time,
                                "load_duration": 0,
@@ -1538,8 +1541,8 @@ def create_app(args):

                                    total_response += chunk
                                    data = {
-                                        "model": LIGHTRAG_MODEL,
-                                        "created_at": LIGHTRAG_CREATED_AT,
+                                        "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                        "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                        "response": chunk,
                                        "done": False,
                                    }
@@ -1551,8 +1554,8 @@ def create_app(args):
                            eval_time = last_chunk_time - first_chunk_time

                            data = {
-                                "model": LIGHTRAG_MODEL,
-                                "created_at": LIGHTRAG_CREATED_AT,
+                                "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                "done": True,
                                "total_duration": total_time,
                                "load_duration": 0,
@@ -1596,8 +1599,8 @@ def create_app(args):
                eval_time = last_chunk_time - first_chunk_time

                return {
-                    "model": LIGHTRAG_MODEL,
-                    "created_at": LIGHTRAG_CREATED_AT,
+                    "model": ollama_server_infos.LIGHTRAG_MODEL,
+                    "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                    "response": str(response_text),
                    "done": True,
                    "total_duration": total_time,
@@ -1669,8 +1672,8 @@ def create_app(args):
                            total_response = response

                            data = {
-                                "model": LIGHTRAG_MODEL,
-                                "created_at": LIGHTRAG_CREATED_AT,
+                                "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                "message": {
                                    "role": "assistant",
                                    "content": response,
@@ -1686,8 +1689,8 @@ def create_app(args):
                            eval_time = last_chunk_time - first_chunk_time

                            data = {
-                                "model": LIGHTRAG_MODEL,
-                                "created_at": LIGHTRAG_CREATED_AT,
+                                "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                "done": True,
                                "total_duration": total_time,
                                "load_duration": 0,
@@ -1707,8 +1710,8 @@ def create_app(args):

                                    total_response += chunk
                                    data = {
-                                        "model": LIGHTRAG_MODEL,
-                                        "created_at": LIGHTRAG_CREATED_AT,
+                                        "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                        "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                        "message": {
                                            "role": "assistant",
                                            "content": chunk,
@@ -1724,8 +1727,8 @@ def create_app(args):
                            eval_time = last_chunk_time - first_chunk_time

                            data = {
-                                "model": LIGHTRAG_MODEL,
-                                "created_at": LIGHTRAG_CREATED_AT,
+                                "model": ollama_server_infos.LIGHTRAG_MODEL,
+                                "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                                "done": True,
                                "total_duration": total_time,
                                "load_duration": 0,
@@ -1780,8 +1783,8 @@ def create_app(args):
                eval_time = last_chunk_time - first_chunk_time

                return {
-                    "model": LIGHTRAG_MODEL,
-                    "created_at": LIGHTRAG_CREATED_AT,
+                    "model": ollama_server_infos.LIGHTRAG_MODEL,
+                    "created_at": ollama_server_infos.LIGHTRAG_CREATED_AT,
                    "message": {
                        "role": "assistant",
                        "content": str(response_text),
@@ -1824,10 +1827,10 @@ def create_app(args):
                "embedding_binding_host": args.embedding_binding_host,
                "embedding_model": args.embedding_model,
                "max_tokens": args.max_tokens,
-                "kv_storage": KV_STORAGE,
-                "doc_status_storage": DOC_STATUS_STORAGE,
-                "graph_storage": GRAPH_STORAGE,
-                "vector_storage": VECTOR_STORAGE,
+                "kv_storage": ollama_server_infos.KV_STORAGE,
+                "doc_status_storage": ollama_server_infos.DOC_STATUS_STORAGE,
+                "graph_storage": ollama_server_infos.GRAPH_STORAGE,
+                "vector_storage": ollama_server_infos.VECTOR_STORAGE,
            },
        }