From 6e3ff1857046b3e2f65285e464f0c54471f16d9b Mon Sep 17 00:00:00 2001
From: yangdx
Date: Tue, 18 Nov 2025 23:14:50 +0800
Subject: [PATCH] Adjust chunking parameters to match the default environment variable settings

(cherry picked from commit e77340d4a1b3f09e559e307e4a37aa78c4744800)
---
 lightrag/operate.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/lightrag/operate.py b/lightrag/operate.py
index b0736402..3a7502c1 100644
--- a/lightrag/operate.py
+++ b/lightrag/operate.py
@@ -72,8 +72,8 @@ def chunking_by_token_size(
     content: str,
     split_by_character: str | None = None,
     split_by_character_only: bool = False,
-    chunk_overlap_token_size: int = 128,
-    chunk_token_size: int = 1024,
+    chunk_overlap_token_size: int = 100,
+    chunk_token_size: int = 1200,
 ) -> list[dict[str, Any]]:
     tokens = tokenizer.encode(content)
     results: list[dict[str, Any]] = []