From 7c7b8a319ba1d457411f67579e2e21beed6ca617 Mon Sep 17 00:00:00 2001 From: Vasilije <8619304+Vasilije1990@users.noreply.github.com> Date: Thu, 8 Aug 2024 20:12:34 +0200 Subject: [PATCH] Enable different chunking methods --- cognee/modules/data/processing/document_types/AudioDocument.py | 2 +- cognee/modules/data/processing/document_types/PdfDocument.py | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/cognee/modules/data/processing/document_types/AudioDocument.py b/cognee/modules/data/processing/document_types/AudioDocument.py index d0eeee2fc..28fab07ed 100644 --- a/cognee/modules/data/processing/document_types/AudioDocument.py +++ b/cognee/modules/data/processing/document_types/AudioDocument.py @@ -11,7 +11,7 @@ from cognee.tasks.chunking.chunking_registry import get_chunking_function class AudioReader: id: UUID file_path: str - chunking_function:callable + chunking_strategy:str def __init__(self, id: UUID, file_path: str, chunking_strategy:str = "paragraph"): self.id = id diff --git a/cognee/modules/data/processing/document_types/PdfDocument.py b/cognee/modules/data/processing/document_types/PdfDocument.py index 901975841..0952fd879 100644 --- a/cognee/modules/data/processing/document_types/PdfDocument.py +++ b/cognee/modules/data/processing/document_types/PdfDocument.py @@ -12,6 +12,7 @@ from .Document import Document class PdfReader(): id: UUID file_path: str + chunking_strategy: str def __init__(self, id: UUID, file_path: str, chunking_strategy:str = "paragraph"): self.id = id