From 3f845d122d137c9c970639455d8a759ff1ff676d Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Rapha=C3=ABl=20MANSUY?=
Date: Fri, 5 Dec 2025 14:44:31 +0800
Subject: [PATCH] Fix: make config parsing import-safe (parse_known_args) and
 add gpt5 kwargs normalization helper

---
 lightrag/api/config.py |  5 ++++-
 lightrag/llm/openai.py | 33 +++++++++++++++++++++++++++++++++
 2 files changed, 37 insertions(+), 1 deletion(-)

diff --git a/lightrag/api/config.py b/lightrag/api/config.py
index a02a1cae..ac507c8e 100644
--- a/lightrag/api/config.py
+++ b/lightrag/api/config.py
@@ -296,7 +296,10 @@ def parse_args() -> argparse.Namespace:
     elif os.environ.get("LLM_BINDING") == "gemini":
         GeminiLLMOptions.add_args(parser)
 
-    args = parser.parse_args()
+    # Use parse_known_args so unknown arguments (e.g. pytest's CLI flags)
+    # do not cause a SystemExit during test collection or when importing
+    # this module in other tooling. Unknown args will be ignored.
+    args, _ = parser.parse_known_args()
 
     # convert relative path to absolute path
     args.working_dir = os.path.abspath(args.working_dir)

diff --git a/lightrag/llm/openai.py b/lightrag/llm/openai.py
index 9c3d0261..ee8b2dd5 100644
--- a/lightrag/llm/openai.py
+++ b/lightrag/llm/openai.py
@@ -592,6 +592,39 @@ async def openai_complete_if_cache(
         await openai_async_client.close()
 
 
+def _normalize_openai_kwargs_for_model(model: str, kwargs: dict[str, Any]) -> None:
+    """Normalize OpenAI kwargs for specific models.
+
+    For gpt-5 family models (e.g., gpt-5-nano) we convert legacy `max_tokens`
+    to `max_completion_tokens` with a small safety buffer and strip
+    unsupported parameters such as `temperature`.
+
+    This is an in-place operation on the provided kwargs dict.
+
+    """
+    name = (model or "").lower()
+
+    # Work on gpt-5 family which expects `max_completion_tokens` instead of `max_tokens`
+    if name.startswith("gpt-5"):
+        # If explicit max_completion_tokens present keep it, otherwise convert from max_tokens
+        if "max_completion_tokens" not in kwargs and "max_tokens" in kwargs:
+            try:
+                orig = int(kwargs.get("max_tokens", 0))
+            except Exception:
+                orig = 0
+
+            # Add a small buffer (5%) + 1 token to be safe
+            buffered = int(orig * 1.05) + 1 if orig > 0 else 0
+            # Ensure we never decrease the value
+            kwargs["max_completion_tokens"] = max(buffered, orig)
+
+        # Remove legacy param
+        kwargs.pop("max_tokens", None)
+
+        # gpt-5 family does not use `temperature` parameter the same way; remove it
+        kwargs.pop("temperature", None)
+
+
 async def openai_complete(
     prompt,
     system_prompt=None,