Spaces:

rm-lht
/

lightrag

Configuration error

yangdx committed on Mar 7

Commit

c5022d3

1 Parent(s): 74d902f

Setting LLM cache option for entity extraction from env

Files changed (3) hide show

env.example CHANGED Viewed

@@ -50,6 +50,7 @@
 # MAX_TOKEN_SUMMARY=500        # Max tokens for entity or relations summary
 # SUMMARY_LANGUAGE=English
 # MAX_EMBED_TOKENS=8192
 ### LLM Configuration (Use valid host. For local services installed with docker, you can use host.docker.internal)
 LLM_BINDING=ollama

 # MAX_TOKEN_SUMMARY=500        # Max tokens for entity or relations summary
 # SUMMARY_LANGUAGE=English
 # MAX_EMBED_TOKENS=8192
+# ENABLE_LLM_CACHE_FOR_EXTRACT=false  # Enable LLM cache for entity extraction, defaults to false
 ### LLM Configuration (Use valid host. For local services installed with docker, you can use host.docker.internal)
 LLM_BINDING=ollama

lightrag/api/README.md CHANGED Viewed

@@ -223,6 +223,9 @@ LightRAG supports binding to various LLM/Embedding backends:
 Use environment variable `LLM_BINDING` or CLI argument `--llm-binding` to select the LLM backend type. Use environment variable `EMBEDDING_BINDING` or CLI argument `--embedding-binding` to select the Embedding backend type.
 ### Storage Types Supported
 LightRAG uses 4 types of storage for different purposes:

 Use environment variable `LLM_BINDING` or CLI argument `--llm-binding` to select the LLM backend type. Use environment variable `EMBEDDING_BINDING` or CLI argument `--embedding-binding` to select the Embedding backend type.
+### Entity Extraction Configuration
+- ENABLE_LLM_CACHE_FOR_EXTRACT: Enable LLM cache for entity extraction (default: false)
 ### Storage Types Supported
 LightRAG uses 4 types of storage for different purposes:

lightrag/api/lightrag_server.py CHANGED Viewed

@@ -50,6 +50,9 @@ from .auth import auth_handler
 # This update allows the user to put a different .env file for each lightrag folder
 load_dotenv(".env", override=True)
 # Initialize config parser
 config = configparser.ConfigParser()
 config.read("config.ini")
@@ -323,7 +326,7 @@ def create_app(args):
             vector_db_storage_cls_kwargs={
                 "cosine_better_than_threshold": args.cosine_threshold
             },
-            enable_llm_cache_for_entity_extract=False,  # set to True for debuging to reduce llm fee
             embedding_cache_config={
                 "enabled": True,
                 "similarity_threshold": 0.95,
@@ -352,7 +355,7 @@ def create_app(args):
             vector_db_storage_cls_kwargs={
                 "cosine_better_than_threshold": args.cosine_threshold
             },
-            enable_llm_cache_for_entity_extract=False,  # set to True for debuging to reduce llm fee
             embedding_cache_config={
                 "enabled": True,
                 "similarity_threshold": 0.95,

 # This update allows the user to put a different .env file for each lightrag folder
 load_dotenv(".env", override=True)
+# Read entity extraction cache config
+enable_llm_cache = os.getenv("ENABLE_LLM_CACHE_FOR_EXTRACT", "false").lower() == "true"
 # Initialize config parser
 config = configparser.ConfigParser()
 config.read("config.ini")
             vector_db_storage_cls_kwargs={
                 "cosine_better_than_threshold": args.cosine_threshold
             },
+            enable_llm_cache_for_entity_extract=enable_llm_cache,  # Read from environment variable
             embedding_cache_config={
                 "enabled": True,
                 "similarity_threshold": 0.95,
             vector_db_storage_cls_kwargs={
                 "cosine_better_than_threshold": args.cosine_threshold
             },
+            enable_llm_cache_for_entity_extract=enable_llm_cache,  # Read from environment variable
             embedding_cache_config={
                 "enabled": True,
                 "similarity_threshold": 0.95,