Reduce embedding concurrency limit from 16 to 8

2026-01-08 04:39:55 +00:00 · 2025-07-13 03:13:52 +08:00 · 2025-07-13 03:13:52 +08:00 · 03b40937f7
commit 03b40937f7
parent a2eeae9661
2 changed files with 2 additions and 2 deletions
--- a/env.example
+++ b/env.example
@@ -113,7 +113,7 @@ EMBEDDING_BINDING_HOST=http://localhost:11434
 ### Num of chunks send to Embedding in single request
 # EMBEDDING_BATCH_NUM=10
 ### Max concurrency requests for Embedding
-# EMBEDDING_FUNC_MAX_ASYNC=16
+# EMBEDDING_FUNC_MAX_ASYNC=8
 ### Maximum tokens sent to Embedding for each chunk (no longer in use?)
 # MAX_EMBED_TOKENS=8192
 ### Optional for Azure
--- a/lightrag/lightrag.py
+++ b/lightrag/lightrag.py
@@ -205,7 +205,7 @@ class LightRAG:
    """Batch size for embedding computations."""

    embedding_func_max_async: int = field(
-        default=int(os.getenv("EMBEDDING_FUNC_MAX_ASYNC", 16))
+        default=int(os.getenv("EMBEDDING_FUNC_MAX_ASYNC", 8))
    )
    """Maximum number of concurrent embedding function calls."""