yangdx committed on
Commit
d46e3aa
·
1 Parent(s): a76ad0a

Add RAG configuration options and enhance parameter configurability

Browse files

- Add top-k and cosine-threshold parameters for the API server
- Update .env and CLI parameter handling with new parameters
- Improve splash screen display
- Update base and storage classes to read new parameters from the .env file.

.env.example CHANGED
@@ -6,6 +6,17 @@ PORT=9621
6
  WORKING_DIR=/app/data/rag_storage
7
  INPUT_DIR=/app/data/inputs
8
 
 
 
 
 
 
 
 
 
 
 
 
9
  # LLM Configuration (Use valid host. For local services, you can use host.docker.internal)
10
  # Ollama example
11
  LLM_BINDING=ollama
@@ -38,15 +49,6 @@ EMBEDDING_MODEL=bge-m3:latest
38
  # EMBEDDING_BINDING_HOST=http://host.docker.internal:9600
39
  # EMBEDDING_MODEL=bge-m3:latest
40
 
41
- # RAG Configuration
42
- MAX_ASYNC=4
43
- MAX_TOKENS=32768
44
- EMBEDDING_DIM=1024
45
- MAX_EMBED_TOKENS=8192
46
- #HISTORY_TURNS=3
47
- #CHUNK_SIZE=1200
48
- #CHUNK_OVERLAP_SIZE=100
49
-
50
  # Security (empty for no key)
51
  LIGHTRAG_API_KEY=your-secure-api-key-here
52
 
 
6
  WORKING_DIR=/app/data/rag_storage
7
  INPUT_DIR=/app/data/inputs
8
 
9
+ # RAG Configuration
10
+ MAX_ASYNC=4
11
+ MAX_TOKENS=32768
12
+ EMBEDDING_DIM=1024
13
+ MAX_EMBED_TOKENS=8192
14
+ #HISTORY_TURNS=3
15
+ #CHUNK_SIZE=1200
16
+ #CHUNK_OVERLAP_SIZE=100
17
+ #COSINE_THRESHOLD=0.2
18
+ #TOP_K=50
19
+
20
  # LLM Configuration (Use valid host. For local services, you can use host.docker.internal)
21
  # Ollama example
22
  LLM_BINDING=ollama
 
49
  # EMBEDDING_BINDING_HOST=http://host.docker.internal:9600
50
  # EMBEDDING_MODEL=bge-m3:latest
51
 
 
 
 
 
 
 
 
 
 
52
  # Security (empty for no key)
53
  LIGHTRAG_API_KEY=your-secure-api-key-here
54
 
lightrag/api/lightrag_server.py CHANGED
@@ -207,8 +207,12 @@ def display_splash_screen(args: argparse.Namespace) -> None:
207
  ASCIIColors.yellow(f"{args.chunk_size}")
208
  ASCIIColors.white(" β”œβ”€ Chunk Overlap Size: ", end="")
209
  ASCIIColors.yellow(f"{args.chunk_overlap_size}")
210
- ASCIIColors.white(" └─ History Turns: ", end="")
211
  ASCIIColors.yellow(f"{args.history_turns}")
 
 
 
 
212
 
213
  # System Configuration
214
  ASCIIColors.magenta("\nπŸ› οΈ System Configuration:")
@@ -484,6 +488,20 @@ def parse_args() -> argparse.Namespace:
484
  help="Number of conversation history turns to include (default: from env or 3)",
485
  )
486
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
487
  args = parser.parse_args()
488
 
489
  return args
@@ -846,6 +864,9 @@ def create_app(args):
846
  graph_storage=GRAPH_STORAGE,
847
  vector_storage=VECTOR_STORAGE,
848
  doc_status_storage=DOC_STATUS_STORAGE,
 
 
 
849
  )
850
  else:
851
  rag = LightRAG(
@@ -863,6 +884,9 @@ def create_app(args):
863
  graph_storage=GRAPH_STORAGE,
864
  vector_storage=VECTOR_STORAGE,
865
  doc_status_storage=DOC_STATUS_STORAGE,
 
 
 
866
  )
867
 
868
  async def index_file(file_path: Union[str, Path]) -> None:
@@ -1052,6 +1076,7 @@ def create_app(args):
1052
  mode=request.mode,
1053
  stream=request.stream,
1054
  only_need_context=request.only_need_context,
 
1055
  ),
1056
  )
1057
 
@@ -1093,6 +1118,7 @@ def create_app(args):
1093
  mode=request.mode,
1094
  stream=True,
1095
  only_need_context=request.only_need_context,
 
1096
  ),
1097
  )
1098
 
@@ -1632,6 +1658,7 @@ def create_app(args):
1632
  "stream": request.stream,
1633
  "only_need_context": False,
1634
  "conversation_history": conversation_history,
 
1635
  }
1636
 
1637
  if args.history_turns is not None:
 
207
  ASCIIColors.yellow(f"{args.chunk_size}")
208
  ASCIIColors.white(" β”œβ”€ Chunk Overlap Size: ", end="")
209
  ASCIIColors.yellow(f"{args.chunk_overlap_size}")
210
+ ASCIIColors.white(" β”œβ”€ History Turns: ", end="")
211
  ASCIIColors.yellow(f"{args.history_turns}")
212
+ ASCIIColors.white(" β”œβ”€ Cosine Threshold: ", end="")
213
+ ASCIIColors.yellow(f"{args.cosine_threshold}")
214
+ ASCIIColors.white(" └─ Top-K: ", end="")
215
+ ASCIIColors.yellow(f"{args.top_k}")
216
 
217
  # System Configuration
218
  ASCIIColors.magenta("\nπŸ› οΈ System Configuration:")
 
488
  help="Number of conversation history turns to include (default: from env or 3)",
489
  )
490
 
491
+ # Search parameters
492
+ parser.add_argument(
493
+ "--top-k",
494
+ type=int,
495
+ default=get_env_value("TOP_K", 50, int),
496
+ help="Number of most similar results to return (default: from env or 50)",
497
+ )
498
+ parser.add_argument(
499
+ "--cosine-threshold",
500
+ type=float,
501
+ default=get_env_value("COSINE_THRESHOLD", 0.4, float),
502
+ help="Cosine similarity threshold (default: from env or 0.4)",
503
+ )
504
+
505
  args = parser.parse_args()
506
 
507
  return args
 
864
  graph_storage=GRAPH_STORAGE,
865
  vector_storage=VECTOR_STORAGE,
866
  doc_status_storage=DOC_STATUS_STORAGE,
867
+ vector_db_storage_cls_kwargs={
868
+ "cosine_better_than_threshold": args.cosine_threshold
869
+ },
870
  )
871
  else:
872
  rag = LightRAG(
 
884
  graph_storage=GRAPH_STORAGE,
885
  vector_storage=VECTOR_STORAGE,
886
  doc_status_storage=DOC_STATUS_STORAGE,
887
+ vector_db_storage_cls_kwargs={
888
+ "cosine_better_than_threshold": args.cosine_threshold
889
+ },
890
  )
891
 
892
  async def index_file(file_path: Union[str, Path]) -> None:
 
1076
  mode=request.mode,
1077
  stream=request.stream,
1078
  only_need_context=request.only_need_context,
1079
+ top_k=args.top_k,
1080
  ),
1081
  )
1082
 
 
1118
  mode=request.mode,
1119
  stream=True,
1120
  only_need_context=request.only_need_context,
1121
+ top_k=args.top_k,
1122
  ),
1123
  )
1124
 
 
1658
  "stream": request.stream,
1659
  "only_need_context": False,
1660
  "conversation_history": conversation_history,
1661
+ "top_k": args.top_k,
1662
  }
1663
 
1664
  if args.history_turns is not None:
lightrag/base.py CHANGED
@@ -1,3 +1,4 @@
 
1
  from dataclasses import dataclass, field
2
  from typing import (
3
  TypedDict,
@@ -32,7 +33,7 @@ class QueryParam:
32
  response_type: str = "Multiple Paragraphs"
33
  stream: bool = False
34
  # Number of top-k items to retrieve; corresponds to entities in "local" mode and relationships in "global" mode.
35
- top_k: int = 60
36
  # Number of document chunks to retrieve.
37
  # top_n: int = 10
38
  # Number of tokens for the original chunks.
 
1
+ import os
2
  from dataclasses import dataclass, field
3
  from typing import (
4
  TypedDict,
 
33
  response_type: str = "Multiple Paragraphs"
34
  stream: bool = False
35
  # Number of top-k items to retrieve; corresponds to entities in "local" mode and relationships in "global" mode.
36
+ top_k: int = int(os.getenv("TOP_K", "60"))
37
  # Number of document chunks to retrieve.
38
  # top_n: int = 10
39
  # Number of tokens for the original chunks.
lightrag/kg/nano_vector_db_impl.py CHANGED
@@ -73,7 +73,7 @@ from lightrag.base import (
73
 
74
  @dataclass
75
  class NanoVectorDBStorage(BaseVectorStorage):
76
- cosine_better_than_threshold: float = 0.2
77
 
78
  def __post_init__(self):
79
  self._client_file_name = os.path.join(
 
73
 
74
  @dataclass
75
  class NanoVectorDBStorage(BaseVectorStorage):
76
+ cosine_better_than_threshold: float = float(os.getenv("COSINE_THRESHOLD", "0.2"))
77
 
78
  def __post_init__(self):
79
  self._client_file_name = os.path.join(