From e8a425702e499bdb0be01384c5bf52b8a5d5261c Mon Sep 17 00:00:00 2001 From: Mendon Kissling <59585235+mendonk@users.noreply.github.com> Date: Thu, 9 Oct 2025 14:39:07 -0400 Subject: [PATCH] ingestion-flow --- flows/ingestion_flow.json | 45 +++++++++++++++++++++++++++++++-------- 1 file changed, 36 insertions(+), 9 deletions(-) diff --git a/flows/ingestion_flow.json b/flows/ingestion_flow.json index 911c3e38..79a4d7c4 100644 --- a/flows/ingestion_flow.json +++ b/flows/ingestion_flow.json @@ -1245,7 +1245,7 @@ ], "frozen": false, "icon": "binary", - "last_updated": "2025-10-04T02:17:01.272Z", + "last_updated": "2025-10-09T17:53:28.032Z", "legacy": false, "lf_version": "1.6.3.dev0", "metadata": { @@ -1550,7 +1550,7 @@ ], "frozen": false, "icon": "braces", - "last_updated": "2025-10-04T02:17:01.273Z", + "last_updated": "2025-10-09T17:53:28.034Z", "legacy": false, "lf_version": "1.6.3.dev0", "metadata": {}, @@ -2912,7 +2912,7 @@ ], "frozen": false, "icon": "table", - "last_updated": "2025-10-04T02:17:01.354Z", + "last_updated": "2025-10-09T17:53:28.116Z", "legacy": false, "lf_version": "1.6.3.dev0", "metadata": { @@ -3328,7 +3328,7 @@ ], "frozen": false, "icon": "table", - "last_updated": "2025-10-04T02:17:01.355Z", + "last_updated": "2025-10-09T17:53:28.117Z", "legacy": false, "lf_version": "1.6.3.dev0", "metadata": { @@ -3744,7 +3744,7 @@ ], "frozen": false, "icon": "table", - "last_updated": "2025-10-04T02:17:01.355Z", + "last_updated": "2025-10-09T17:53:28.117Z", "legacy": false, "lf_version": "1.6.3.dev0", "metadata": { @@ -4129,19 +4129,46 @@ }, "selected": false, "type": "genericNode" + }, + { + "data": { + "id": "note-DCu9M", + "node": { + "description": "## README\n\nThis flow transforms raw documents into searchable knowledge stored in an OpenSearch vector database.\nThis [knowledge](https://docs.openr.ag/knowledge) serves as context that your [agents](https://docs.openr.ag/agents) draw upon to answer questions and perform tasks.\n\n* Data sources: This flow 
ingests data from OAuth connectors or from your local machine. For more, see [Ingest Knowledge](https://docs.openr.ag/knowledge#ingest-knowledge).\n* Docling ingestion: The [**Docling Serve** component](https://docs.openr.ag/ingestion) processes input documents by connecting to your instance of Docling Serve. For more, see [Docling Ingestion](https://docs.openr.ag/ingestion).\n* Processing: The flow adds metadata through three [**DataFrame Operations** components](https://docs.langflow.org/components-processing#dataframe-operations) that add `filename`, `file_size`, and `mimetype` columns.\nThe **Split Text** component then splits the processed text into uniform, easily searchable chunks.\n* Embedding generation: The [**Embedding Model** component](https://docs.langflow.org/components-embedding-models) generates vector embeddings with the model you selected at [Application onboarding](https://docs.openr.ag/install#application-onboarding), and the [**OpenSearch** component](https://docs.langflow.org/bundles-elastic#opensearch) stores the processed documents and their embeddings in the documents index.\n* Metadata and ownership: The **Secret Input** components provide user context that is stored as metadata in OpenSearch. 
These fields are populated from OAuth configuration values, and enable multi-tenant document isolation in OpenSearch, so each user's documents remain private and traceable.\n\nFor more information, see the [OpenRAG docs](https://docs.openr.ag/ingestion#knowledge-ingestion-flows).\n", + "display_name": "", + "documentation": "", + "template": {} + }, + "type": "note" + }, + "dragging": false, + "height": 439, + "id": "note-DCu9M", + "measured": { + "height": 439, + "width": 1000 + }, + "position": { + "x": -538.3997974029603, + "y": 1984.9915833571447 + }, + "resizing": true, + "selected": true, + "type": "noteNode", + "width": 1000 } ], "viewport": { - "x": 227.3737875665738, - "y": -299.1651660660417, - "zoom": 0.43587407227641217 + "x": 439.0828210185154, + "y": -485.0911154471861, + "zoom": 0.5133513373758299 } }, "description": "Load your data for chat context with Retrieval Augmented Generation.", "endpoint_name": null, "id": "5488df7c-b93f-4f87-a446-b67028bc0813", "is_component": false, - "last_tested_version": "1.6.3.dev0", + "last_tested_version": "1.6.3.dev1", "name": "OpenSearch Ingestion Flow", "tags": [ "openai",