Fix special character handling for Postgres

2025-04-17 22:58:36 +08:00
parent 14b4bc96ce
commit a3ca134e97
3 changed files with 10 additions and 5 deletions
--- a/lightrag/kg/postgres_impl.py
+++ b/lightrag/kg/postgres_impl.py
@@ -1049,10 +1049,10 @@ class PGGraphStorage(BaseGraphStorage):
        Returns:
            Normalized node ID suitable for Cypher queries
        """
        # Remove quotes
        normalized_id = node_id.strip('"')
        # Escape backslashes
        normalized_id = node_id
        normalized_id = normalized_id.replace("\\", "\\\\")
        normalized_id = normalized_id.replace('"', '\\"')
        return normalized_id
    async def initialize(self):
--- a/lightrag/operate.py
+++ b/lightrag/operate.py
@@ -157,8 +157,8 @@ async def _handle_single_entity_extraction(
        return None
    # Clean and validate entity name
-    entity_name = clean_str(record_attributes[1]).strip('"')
+    entity_name = clean_str(record_attributes[1]).strip()
-    if not entity_name.strip():
+    if not entity_name:
        logger.warning(
            f"Entity extraction error: empty entity name in: {record_attributes}"
        )
--- a/lightrag/utils.py
+++ b/lightrag/utils.py
@@ -1385,7 +1385,12 @@ def normalize_extracted_info(name: str, is_entity=False) -> str:
    name = re.sub(r"(?<=[a-zA-Z0-9])\s+(?=[\u4e00-\u9fa5])", "", name)
    # Remove English quotation marks from the beginning and end
-    name = name.strip('"').strip("'")
+    if (
        len(name) >= 2
        and name.startswith('"')
        and name.endswith('"')
    ):
        name = name[1:-1]
    if is_entity:
        # remove Chinese quotes