Fix: make config parsing import-safe (parse_known_args) and add gpt5 kwargs normalization helper

2025-12-05 14:44:31 +08:00 · 2025-12-05 14:44:31 +08:00 · 3f845d122d
commit 3f845d122d
parent ad1d357b0d
2 changed files with 37 additions and 1 deletions
--- a/lightrag/api/config.py
+++ b/lightrag/api/config.py
@ -296,7 +296,10 @@ def parse_args() -> argparse.Namespace:
    elif os.environ.get("LLM_BINDING") == "gemini":
        GeminiLLMOptions.add_args(parser)
-    args = parser.parse_args()
+    # Use parse_known_args so unknown arguments (e.g. pytest's CLI flags)
    # do not cause a SystemExit during test collection or when importing
    # this module in other tooling. Unknown args will be ignored.
    args, _ = parser.parse_known_args()
    # convert relative path to absolute path
    args.working_dir = os.path.abspath(args.working_dir)
--- a/lightrag/llm/openai.py
+++ b/lightrag/llm/openai.py
@ -592,6 +592,39 @@ async def openai_complete_if_cache(
            await openai_async_client.close()
 def _normalize_openai_kwargs_for_model(model: str, kwargs: dict[str, Any]) -> None:
    """Normalize OpenAI kwargs for specific models.
    For gpt-5 family models (e.g., gpt-5-nano) we convert legacy `max_tokens`
    to `max_completion_tokens` with a small safety buffer and strip
    unsupported parameters such as `temperature`.
    This is an in-place operation on the provided kwargs dict.
    """
    name = (model or "").lower()
    # Work on gpt-5 family which expects `max_completion_tokens` instead of `max_tokens`
    if name.startswith("gpt-5"):
        # If explicit max_completion_tokens present keep it, otherwise convert from max_tokens
        if "max_completion_tokens" not in kwargs and "max_tokens" in kwargs:
            try:
                orig = int(kwargs.get("max_tokens", 0))
            except Exception:
                orig = 0
            # Add a small buffer (5%) + 1 token to be safe
            buffered = int(orig * 1.05) + 1 if orig > 0 else 0
            # Ensure we never decrease the value
            kwargs["max_completion_tokens"] = max(buffered, orig)
        # Remove legacy param
        kwargs.pop("max_tokens", None)
        # gpt-5 family does not use `temperature` parameter the same way; remove it
        kwargs.pop("temperature", None)
 async def openai_complete(
    prompt,
    system_prompt=None,