Get metadata from metadata table
This commit is contained in:
parent
cd0e505ac0
commit
15802237e9
3 changed files with 8 additions and 3 deletions
|
|
@ -14,4 +14,6 @@ async def get_metadata(metadata_id: UUID) -> Metadata:
|
||||||
async with db_engine.get_async_session() as session:
|
async with db_engine.get_async_session() as session:
|
||||||
metadata = await session.get(Metadata, metadata_id)
|
metadata = await session.get(Metadata, metadata_id)
|
||||||
|
|
||||||
return json.parse(metadata)
|
return metadata
|
||||||
|
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -15,6 +15,7 @@ async def write_metadata(data_item: Any, data_id: UUID) -> UUID:
|
||||||
db_engine = get_relational_engine()
|
db_engine = get_relational_engine()
|
||||||
async with db_engine.get_async_session() as session:
|
async with db_engine.get_async_session() as session:
|
||||||
metadata = Metadata(
|
metadata = Metadata(
|
||||||
|
id=data_id,
|
||||||
metadata_repr=json.dumps(metadata_dict),
|
metadata_repr=json.dumps(metadata_dict),
|
||||||
metadata_source=parse_type(type(data_item)),
|
metadata_source=parse_type(type(data_item)),
|
||||||
data_id=data_id
|
data_id=data_id
|
||||||
|
|
|
||||||
|
|
@ -6,6 +6,7 @@ from cognee.modules.data.processing.document_types import (
|
||||||
ImageDocument,
|
ImageDocument,
|
||||||
TextDocument,
|
TextDocument,
|
||||||
)
|
)
|
||||||
|
from cognee.modules.data.operations.get_metadata import get_metadata
|
||||||
|
|
||||||
EXTENSION_TO_DOCUMENT_CLASS = {
|
EXTENSION_TO_DOCUMENT_CLASS = {
|
||||||
"pdf": PdfDocument, # Text documents
|
"pdf": PdfDocument, # Text documents
|
||||||
|
|
@ -38,15 +39,16 @@ EXTENSION_TO_DOCUMENT_CLASS = {
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
def classify_documents(data_documents: list[Data]) -> list[Document]:
|
async def classify_documents(data_documents: list[Data]) -> list[Document]:
|
||||||
documents = []
|
documents = []
|
||||||
for data_item in data_documents:
|
for data_item in data_documents:
|
||||||
|
metadata = await get_metadata(data_item.id)
|
||||||
document = EXTENSION_TO_DOCUMENT_CLASS[data_item.extension](
|
document = EXTENSION_TO_DOCUMENT_CLASS[data_item.extension](
|
||||||
id=data_item.id,
|
id=data_item.id,
|
||||||
title=f"{data_item.name}.{data_item.extension}",
|
title=f"{data_item.name}.{data_item.extension}",
|
||||||
raw_data_location=data_item.raw_data_location,
|
raw_data_location=data_item.raw_data_location,
|
||||||
name=data_item.name,
|
name=data_item.name,
|
||||||
metadata_id=data_item.metadata_id
|
metadata_id=metadata.id
|
||||||
)
|
)
|
||||||
documents.append(document)
|
documents.append(document)
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Add table
Reference in a new issue