Handle azure models as well

2025-01-07 15:00:58 +01:00 · 2025-01-07 15:00:58 +01:00 · fb13a1b61a
commit fb13a1b61a
parent a774191ed3
1 changed files with 2 additions and 0 deletions
--- a/cognee/tasks/chunks/chunk_by_paragraph.py
+++ b/cognee/tasks/chunks/chunk_by_paragraph.py
@ -29,6 +29,8 @@ def chunk_by_paragraph(
    for paragraph_id, sentence, word_count, end_type in chunk_by_sentence(data, maximum_length=paragraph_length):
        # Check if this sentence would exceed length limit
        if embedding_model:
+            if embedding_model.startswith("azure/"):
+                embedding_model = embedding_model.split("/")[-1]
            tokenizer = tiktoken.encoding_for_model(embedding_model)
            token_count = len(tokenizer.encode(sentence))
        else: