Reduce embedding concurrency limit from 16 to 8

This commit is contained in:
yangdx 2025-07-13 03:13:52 +08:00
parent a2eeae9661
commit 03b40937f7
2 changed files with 2 additions and 2 deletions

View File

@@ -113,7 +113,7 @@ EMBEDDING_BINDING_HOST=http://localhost:11434
### Num of chunks send to Embedding in single request
# EMBEDDING_BATCH_NUM=10
### Max concurrency requests for Embedding
-# EMBEDDING_FUNC_MAX_ASYNC=16
+# EMBEDDING_FUNC_MAX_ASYNC=8
### Maximum tokens sent to Embedding for each chunk (no longer in use?)
# MAX_EMBED_TOKENS=8192
### Optional for Azure

View File

@@ -205,7 +205,7 @@ class LightRAG:
"""Batch size for embedding computations."""
embedding_func_max_async: int = field(
-default=int(os.getenv("EMBEDDING_FUNC_MAX_ASYNC", 16))
+default=int(os.getenv("EMBEDDING_FUNC_MAX_ASYNC", 8))
)
"""Maximum number of concurrent embedding function calls."""