Merge pull request #900 from YanSte/cleanup-3
Browse files- examples/test_faiss.py +1 -1
- lightrag/__init__.py +1 -1
- lightrag/kg/networkx_impl.py +2 -1
- lightrag/lightrag.py +2 -9
- lightrag/operate.py +12 -12
examples/test_faiss.py
CHANGED
@@ -70,7 +70,7 @@ def main():
|
|
70 |
),
|
71 |
vector_storage="FaissVectorDBStorage",
|
72 |
vector_db_storage_cls_kwargs={
|
73 |
-
"cosine_better_than_threshold": 0.
|
74 |
},
|
75 |
)
|
76 |
|
|
|
70 |
),
|
71 |
vector_storage="FaissVectorDBStorage",
|
72 |
vector_db_storage_cls_kwargs={
|
73 |
+
"cosine_better_than_threshold": 0.2 # Your desired threshold
|
74 |
},
|
75 |
)
|
76 |
|
lightrag/__init__.py
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
from .lightrag import LightRAG as LightRAG, QueryParam as QueryParam
|
2 |
|
3 |
-
__version__ = "1.1.9"
|
4 |
__author__ = "Zirui Guo"
|
5 |
__url__ = "https://github.com/HKUDS/LightRAG"
|
|
|
1 |
from .lightrag import LightRAG as LightRAG, QueryParam as QueryParam
|
2 |
|
3 |
+
__version__ = "1.1.10"
|
4 |
__author__ = "Zirui Guo"
|
5 |
__url__ = "https://github.com/HKUDS/LightRAG"
|
lightrag/kg/networkx_impl.py
CHANGED
@@ -16,11 +16,12 @@ import pipmaster as pm
|
|
16 |
|
17 |
if not pm.is_installed("networkx"):
|
18 |
pm.install("networkx")
|
|
|
19 |
if not pm.is_installed("graspologic"):
|
20 |
pm.install("graspologic")
|
21 |
|
22 |
-
from graspologic import embed
|
23 |
import networkx as nx
|
|
|
24 |
|
25 |
|
26 |
@final
|
|
|
16 |
|
17 |
if not pm.is_installed("networkx"):
|
18 |
pm.install("networkx")
|
19 |
+
|
20 |
if not pm.is_installed("graspologic"):
|
21 |
pm.install("graspologic")
|
22 |
|
|
|
23 |
import networkx as nx
|
24 |
+
from graspologic import embed
|
25 |
|
26 |
|
27 |
@final
|
lightrag/lightrag.py
CHANGED
@@ -184,7 +184,7 @@ class LightRAG:
|
|
184 |
"""Maximum number of concurrent embedding function calls."""
|
185 |
|
186 |
embedding_cache_config: dict[str, Any] = field(
|
187 |
-
|
188 |
"enabled": False,
|
189 |
"similarity_threshold": 0.95,
|
190 |
"use_llm_check": False,
|
@@ -727,7 +727,7 @@ class LightRAG:
|
|
727 |
|
728 |
async def _process_entity_relation_graph(self, chunk: dict[str, Any]) -> None:
|
729 |
try:
|
730 |
-
new_kg = await extract_entities(
|
731 |
chunk,
|
732 |
knowledge_graph_inst=self.chunk_entity_relation_graph,
|
733 |
entity_vdb=self.entities_vdb,
|
@@ -735,13 +735,6 @@ class LightRAG:
|
|
735 |
llm_response_cache=self.llm_response_cache,
|
736 |
global_config=asdict(self),
|
737 |
)
|
738 |
-
if new_kg is None:
|
739 |
-
logger.info("No new entities or relationships extracted.")
|
740 |
-
else:
|
741 |
-
async with self._entity_lock:
|
742 |
-
logger.info("New entities or relationships extracted.")
|
743 |
-
self.chunk_entity_relation_graph = new_kg
|
744 |
-
|
745 |
except Exception as e:
|
746 |
logger.error("Failed to extract entities and relationships")
|
747 |
raise e
|
|
|
184 |
"""Maximum number of concurrent embedding function calls."""
|
185 |
|
186 |
embedding_cache_config: dict[str, Any] = field(
|
187 |
+
default_factory=lambda: {
|
188 |
"enabled": False,
|
189 |
"similarity_threshold": 0.95,
|
190 |
"use_llm_check": False,
|
|
|
727 |
|
728 |
async def _process_entity_relation_graph(self, chunk: dict[str, Any]) -> None:
|
729 |
try:
|
730 |
+
await extract_entities(
|
731 |
chunk,
|
732 |
knowledge_graph_inst=self.chunk_entity_relation_graph,
|
733 |
entity_vdb=self.entities_vdb,
|
|
|
735 |
llm_response_cache=self.llm_response_cache,
|
736 |
global_config=asdict(self),
|
737 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
738 |
except Exception as e:
|
739 |
logger.error("Failed to extract entities and relationships")
|
740 |
raise e
|
lightrag/operate.py
CHANGED
@@ -329,7 +329,7 @@ async def extract_entities(
|
|
329 |
relationships_vdb: BaseVectorStorage,
|
330 |
global_config: dict[str, str],
|
331 |
llm_response_cache: BaseKVStorage | None = None,
|
332 |
-
) -> BaseGraphStorage | None:
|
333 |
use_llm_func: callable = global_config["llm_model_func"]
|
334 |
entity_extract_max_gleaning = global_config["entity_extract_max_gleaning"]
|
335 |
enable_llm_cache_for_entity_extract: bool = global_config[
|
@@ -522,16 +522,18 @@ async def extract_entities(
|
|
522 |
]
|
523 |
)
|
524 |
|
525 |
-
if not len(all_entities_data) and not len(all_relationships_data):
|
526 |
-
logger.warning(
|
527 |
-
"Didn't extract any entities and relationships, maybe your LLM is not working"
|
528 |
-
)
|
529 |
-
return None
|
530 |
|
531 |
-
if not len(all_entities_data):
|
532 |
-
logger.warning("Didn't extract any entities")
|
533 |
-
if not len(all_relationships_data):
|
534 |
-
logger.warning("Didn't extract any relationships")
|
|
|
|
|
|
|
|
|
535 |
|
536 |
if entity_vdb is not None:
|
537 |
data_for_vdb = {
|
@@ -560,8 +562,6 @@ async def extract_entities(
|
|
560 |
}
|
561 |
await relationships_vdb.upsert(data_for_vdb)
|
562 |
|
563 |
-
return knowledge_graph_inst
|
564 |
-
|
565 |
|
566 |
async def kg_query(
|
567 |
query: str,
|
|
|
329 |
relationships_vdb: BaseVectorStorage,
|
330 |
global_config: dict[str, str],
|
331 |
llm_response_cache: BaseKVStorage | None = None,
|
332 |
+
) -> None:
|
333 |
use_llm_func: callable = global_config["llm_model_func"]
|
334 |
entity_extract_max_gleaning = global_config["entity_extract_max_gleaning"]
|
335 |
enable_llm_cache_for_entity_extract: bool = global_config[
|
|
|
522 |
]
|
523 |
)
|
524 |
|
525 |
+
if not (all_entities_data or all_relationships_data):
|
526 |
+
logger.info("Didn't extract any entities and relationships.")
|
527 |
+
return
|
|
|
|
|
528 |
|
529 |
+
if not all_entities_data:
|
530 |
+
logger.info("Didn't extract any entities")
|
531 |
+
if not all_relationships_data:
|
532 |
+
logger.info("Didn't extract any relationships")
|
533 |
+
|
534 |
+
logger.info(
|
535 |
+
f"New entities or relationships extracted, entities:{all_entities_data}, relationships:{all_relationships_data}"
|
536 |
+
)
|
537 |
|
538 |
if entity_vdb is not None:
|
539 |
data_for_vdb = {
|
|
|
562 |
}
|
563 |
await relationships_vdb.upsert(data_for_vdb)
|
564 |
|
|
|
|
|
565 |
|
566 |
async def kg_query(
|
567 |
query: str,
|