From e8fc6c89525fd22bc646db5a84a9d73f4beea6be Mon Sep 17 00:00:00 2001 From: Vasilije <8619304+Vasilije1990@users.noreply.github.com> Date: Thu, 17 Aug 2023 08:41:30 +0200 Subject: [PATCH] quick fix to the bug --- level_1/level_1_pdf_vectorstore_dlt_etl.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/level_1/level_1_pdf_vectorstore_dlt_etl.py b/level_1/level_1_pdf_vectorstore_dlt_etl.py index c6cfb5ca3..7186df587 100644 --- a/level_1/level_1_pdf_vectorstore_dlt_etl.py +++ b/level_1/level_1_pdf_vectorstore_dlt_etl.py @@ -363,12 +363,12 @@ def main(raw_loading, processed_loading,document_paths): file_path = os.path.join(BASE_DIR, "ticket_schema.json") json_schema = load_json_or_infer_schema(file_path, document) output = _convert_pdf_to_document(path=document) - find_data_in_store = get_from_weaviate(query="Train", path=['year'], operator='Equal', valueText='2017*') + try: + find_data_in_store = get_from_weaviate(query="Train", path=['year'], operator='Equal', valueText='2017*') - if find_data_in_store: output = find_data_in_store print(output[1]) - else: + except: load_to_weaviate(document) pipeline = dlt.pipeline(pipeline_name="train_ticket", destination='duckdb', dataset_name='train_ticket_data')