add docling presets

This commit is contained in:
Mike Fortman 2025-09-20 11:05:01 -05:00
parent 88c9d60986
commit 7da9b98204
3 changed files with 91 additions and 13 deletions

View file

@ -106,6 +106,7 @@ async def async_response_stream(
model: str,
extra_headers: dict = None,
previous_response_id: str = None,
tweaks: dict = None,
log_prefix: str = "response",
):
logger.info("User prompt received", prompt=prompt)
@ -120,6 +121,8 @@ async def async_response_stream(
}
if previous_response_id is not None:
request_params["previous_response_id"] = previous_response_id
if tweaks:
request_params["tweaks"] = tweaks
if "x-api-key" not in client.default_headers:
if hasattr(client, "api_key") and extra_headers is not None:
@ -196,6 +199,7 @@ async def async_response(
model: str,
extra_headers: dict = None,
previous_response_id: str = None,
tweaks: dict = None,
log_prefix: str = "response",
):
try:
@ -210,6 +214,8 @@ async def async_response(
}
if previous_response_id is not None:
request_params["previous_response_id"] = previous_response_id
if tweaks:
request_params["tweaks"] = tweaks
if extra_headers:
request_params["extra_headers"] = extra_headers
@ -243,6 +249,7 @@ async def async_stream(
model: str,
extra_headers: dict = None,
previous_response_id: str = None,
tweaks: dict = None,
log_prefix: str = "response",
):
async for chunk in async_response_stream(
@ -251,6 +258,7 @@ async def async_stream(
model,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=tweaks,
log_prefix=log_prefix,
):
yield chunk
@ -263,6 +271,7 @@ async def async_langflow(
prompt: str,
extra_headers: dict = None,
previous_response_id: str = None,
tweaks: dict = None,
):
response_text, response_id, response_obj = await async_response(
langflow_client,
@ -270,6 +279,7 @@ async def async_langflow(
flow_id,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=tweaks,
log_prefix="langflow",
)
return response_text, response_id
@ -282,6 +292,7 @@ async def async_langflow_stream(
prompt: str,
extra_headers: dict = None,
previous_response_id: str = None,
tweaks: dict = None,
):
logger.debug("Starting langflow stream", prompt=prompt)
try:
@ -291,6 +302,7 @@ async def async_langflow_stream(
flow_id,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=tweaks,
log_prefix="langflow",
):
logger.debug(
@ -451,6 +463,7 @@ async def async_langflow_chat(
user_id: str,
extra_headers: dict = None,
previous_response_id: str = None,
tweaks: dict = None,
store_conversation: bool = True,
):
logger.debug(
@ -484,6 +497,7 @@ async def async_langflow_chat(
flow_id,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=tweaks,
log_prefix="langflow",
)
logger.debug(
@ -562,6 +576,7 @@ async def async_langflow_chat_stream(
user_id: str,
extra_headers: dict = None,
previous_response_id: str = None,
tweaks: dict = None,
):
logger.debug(
"async_langflow_chat_stream called",
@ -588,6 +603,7 @@ async def async_langflow_chat_stream(
flow_id,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=tweaks,
log_prefix="langflow",
):
# Extract text content to build full response for history

View file

@ -1,3 +1,5 @@
import json
import platform
from starlette.responses import JSONResponse
from utils.logging_config import get_logger
from config.settings import (
@ -12,6 +14,60 @@ from config.settings import (
logger = get_logger(__name__)
# Docling preset configurations
def get_docling_preset_configs():
    """Return the docling preset configurations, keyed by preset name.

    Settings are adjusted for the host platform: on macOS ("Darwin") the
    OCR engine is "ocrmac" and the VLM preset uses the MLX build of the
    SmolDocling model; elsewhere "easyocr" and the standard model are used.
    """
    on_mac = platform.system() == "Darwin"
    ocr_engine = "ocrmac" if on_mac else "easyocr"
    vlm_repo = (
        "ds4sd/SmolDocling-256M-preview-mlx-bf16"
        if on_mac
        else "ds4sd/SmolDocling-256M-preview"
    )
    presets = {
        "standard": {"do_ocr": False},
        "ocr": {"do_ocr": True, "ocr_engine": ocr_engine},
        "picture_description": {
            "do_ocr": True,
            "ocr_engine": ocr_engine,
            "do_picture_classification": True,
            "do_picture_description": True,
            "picture_description_local": {
                "repo_id": "HuggingFaceTB/SmolVLM-256M-Instruct",
                "prompt": "Describe this image in a few sentences.",
            },
        },
        "VLM": {
            "pipeline": "vlm",
            "vlm_pipeline_model_local": {
                "repo_id": vlm_repo,
                "response_format": "doctags",
                "inference_framework": "mlx",
            },
        },
    }
    return presets
def get_docling_tweaks(
    docling_preset: str = None,
    component_id: str = "DoclingRemote-ayRdw",
) -> dict:
    """Build the Langflow tweaks dict for the docling component.

    Args:
        docling_preset: Name of the preset to apply. When falsy, the
            current preset is read from the OpenRAG config
            (``openrag_config.knowledge.doclingPresets``). Names not
            found in the preset table fall back to "standard".
        component_id: ID of the Langflow component whose serve options
            are overridden. Defaults to the DoclingRemote component ID
            used by the chat flow — previously hard-coded in the return
            literal; exposed as a parameter so other flows can reuse
            this helper without changing existing callers.

    Returns:
        dict: ``{component_id: {"docling_serve_opts": <JSON string>}}``
        suitable for passing as Langflow request ``tweaks``.
    """
    if not docling_preset:
        # No explicit preset: read the one configured in settings.
        openrag_config = get_openrag_config()
        docling_preset = openrag_config.knowledge.doclingPresets

    preset_configs = get_docling_preset_configs()
    if docling_preset not in preset_configs:
        docling_preset = "standard"  # unknown preset -> safe fallback

    # Langflow expects the serve options as a JSON-encoded string.
    docling_serve_opts = json.dumps(preset_configs[docling_preset])
    return {component_id: {"docling_serve_opts": docling_serve_opts}}
async def get_settings(request, session_manager):
@ -174,7 +230,8 @@ async def update_settings(request, session_manager):
# Update knowledge settings
if "doclingPresets" in body:
valid_presets = ["standard", "ocr", "picture_description", "VLM"]
preset_configs = get_docling_preset_configs()
valid_presets = list(preset_configs.keys())
if body["doclingPresets"] not in valid_presets:
return JSONResponse(
{"error": f"doclingPresets must be one of: {', '.join(valid_presets)}"},

View file

@ -1,20 +1,12 @@
from config.settings import NUDGES_FLOW_ID, clients, LANGFLOW_URL
from agent import (
async_chat,
async_langflow,
async_chat_stream,
)
from auth_context import set_auth_context
import json
from config.settings import NUDGES_FLOW_ID, clients, LANGFLOW_URL, LANGFLOW_CHAT_FLOW_ID
from agent import async_chat, async_langflow, async_chat_stream
from auth_context import set_auth_context
from api.settings import get_docling_tweaks
from utils.logging_config import get_logger
logger = get_logger(__name__)
from agent import async_chat, async_chat_stream, async_langflow
from auth_context import set_auth_context
from config.settings import LANGFLOW_CHAT_FLOW_ID, LANGFLOW_URL, clients
class ChatService:
async def chat(
@ -135,6 +127,9 @@ class ChatService:
"Langflow client not initialized. Ensure LANGFLOW is reachable or set LANGFLOW_KEY."
)
# Get docling tweaks based on current configuration
docling_tweaks = get_docling_tweaks()
if stream:
from agent import async_langflow_chat_stream
@ -145,6 +140,7 @@ class ChatService:
user_id,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=docling_tweaks,
)
else:
from agent import async_langflow_chat
@ -156,6 +152,7 @@ class ChatService:
user_id,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=docling_tweaks,
)
response_data = {"response": response_text}
if response_id:
@ -205,12 +202,16 @@ class ChatService:
from agent import async_langflow_chat
# Get docling tweaks (might not be used by nudges flow, but keeping consistent)
docling_tweaks = get_docling_tweaks()
response_text, response_id = await async_langflow_chat(
langflow_client,
NUDGES_FLOW_ID,
prompt,
user_id,
extra_headers=extra_headers,
tweaks=docling_tweaks,
store_conversation=False,
)
response_data = {"response": response_text}
@ -241,12 +242,16 @@ class ChatService:
raise ValueError(
"Langflow client not initialized. Ensure LANGFLOW is reachable or set LANGFLOW_KEY."
)
# Get docling tweaks based on current configuration
docling_tweaks = get_docling_tweaks()
response_text, response_id = await async_langflow(
langflow_client=langflow_client,
flow_id=LANGFLOW_CHAT_FLOW_ID,
prompt=document_prompt,
extra_headers=extra_headers,
previous_response_id=previous_response_id,
tweaks=docling_tweaks,
)
else: # chat
# Set auth context for chat tools and provide user_id