ingestion-flow

This commit is contained in:
Mendon Kissling 2025-10-09 14:39:07 -04:00
parent 07cf0c93d0
commit e8a425702e

View file

@ -1245,7 +1245,7 @@
],
"frozen": false,
"icon": "binary",
"last_updated": "2025-10-04T02:17:01.272Z",
"last_updated": "2025-10-09T17:53:28.032Z",
"legacy": false,
"lf_version": "1.6.3.dev0",
"metadata": {
@ -1550,7 +1550,7 @@
],
"frozen": false,
"icon": "braces",
"last_updated": "2025-10-04T02:17:01.273Z",
"last_updated": "2025-10-09T17:53:28.034Z",
"legacy": false,
"lf_version": "1.6.3.dev0",
"metadata": {},
@ -2912,7 +2912,7 @@
],
"frozen": false,
"icon": "table",
"last_updated": "2025-10-04T02:17:01.354Z",
"last_updated": "2025-10-09T17:53:28.116Z",
"legacy": false,
"lf_version": "1.6.3.dev0",
"metadata": {
@ -3328,7 +3328,7 @@
],
"frozen": false,
"icon": "table",
"last_updated": "2025-10-04T02:17:01.355Z",
"last_updated": "2025-10-09T17:53:28.117Z",
"legacy": false,
"lf_version": "1.6.3.dev0",
"metadata": {
@ -3744,7 +3744,7 @@
],
"frozen": false,
"icon": "table",
"last_updated": "2025-10-04T02:17:01.355Z",
"last_updated": "2025-10-09T17:53:28.117Z",
"legacy": false,
"lf_version": "1.6.3.dev0",
"metadata": {
@ -4129,19 +4129,46 @@
},
"selected": false,
"type": "genericNode"
},
{
"data": {
"id": "note-DCu9M",
"node": {
"description": "## README\n\nThis flow transforms raw documents into searchable knowledge stored in an OpenSearch vector database.\nThis [knowledge](https://docs.openr.ag/knowledge) serves as context that your [agents](https://docs.openr.ag/agents) draw upon to answer questions and perform tasks.\n\n* Data sources: This flow ingests data from OAuth connectors or from your local machine. For more, see [Ingest Knowledge](https://docs.openr.ag/knowledge#ingest-knowledge).\n* Docling ingestion: The [**Docling Serve** component](https://docs.openr.ag/ingestion) processes input documents by connecting to your instance of Docling Serve. For more, see [Docling Ingestion](https://docs.openr.ag/ingestion).\n* Processing: The flow adds metadata through three [**DataFrame Operations** components](https://docs.langflow.org/components-processing#dataframe-operations) that add `filename`, `file_size`, and `mimetype` columns.\nThe **Split Text** component then splits the processed text into uniform, easily searchable chunks.\n* Embedding generation: The [**Embedding Model** component](https://docs.langflow.org/components-embedding-models) generates vector embeddings with the model you selected at [Application onboarding](https://docs.openr.ag/install#application-onboarding), and the [**OpenSearch** component](https://docs.langflow.org/bundles-elastic#opensearch) stores the processed documents and their embeddings in the documents index.\n* Metadata and ownership: The **Secret Input** components provide user context that is stored as metadata in OpenSearch. These fields are populated from OAuth configuration values and enable multi-tenant document isolation in OpenSearch, so each user's documents remain private and traceable.\n\nFor more information, see the [OpenRAG docs](https://docs.openr.ag/ingestion#knowledge-ingestion-flows).\n",
"display_name": "",
"documentation": "",
"template": {}
},
"type": "note"
},
"dragging": false,
"height": 439,
"id": "note-DCu9M",
"measured": {
"height": 439,
"width": 1000
},
"position": {
"x": -538.3997974029603,
"y": 1984.9915833571447
},
"resizing": true,
"selected": true,
"type": "noteNode",
"width": 1000
}
],
"viewport": {
"x": 227.3737875665738,
"y": -299.1651660660417,
"zoom": 0.43587407227641217
"x": 439.0828210185154,
"y": -485.0911154471861,
"zoom": 0.5133513373758299
}
},
"description": "Load your data for chat context with Retrieval Augmented Generation.",
"endpoint_name": null,
"id": "5488df7c-b93f-4f87-a446-b67028bc0813",
"is_component": false,
"last_tested_version": "1.6.3.dev0",
"last_tested_version": "1.6.3.dev1",
"name": "OpenSearch Ingestion Flow",
"tags": [
"openai",