fix: remove obsolete code
This commit is contained in:
parent 9448e36201
commit d871a7b3d1

6 changed files with 203 additions and 250 deletions
@@ -1,6 +1,6 @@
 # put your configuration values here
 
 [runtime]
-log_level="WARNING" # the system log level of dlt
+log_level = "WARNING" # the system log level of dlt
 # use the dlthub_telemetry setting to enable/disable anonymous usage data reporting, see https://dlthub.com/docs/telemetry
 dlthub_telemetry = false
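The change above only adds spaces around the "="; both spellings parse to the same value. A quick standalone check with Python's tomllib (assuming the file is saved locally as config.toml) shows the runtime settings as they would be read:

    import tomllib  # standard-library TOML parser, Python 3.11+

    with open("config.toml", "rb") as f:  # tomllib requires binary mode
        cfg = tomllib.load(f)

    print(cfg["runtime"]["log_level"])         # "WARNING" with either spelling
    print(cfg["runtime"]["dlthub_telemetry"])  # False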
@@ -1,5 +0,0 @@
-# put your secret values and credentials here. do not share this file and do not push it to github
-
-[destination.qdrant.credentials]
-location = "https://cff4594b-c2de-4fcf-8365-4c1d3a1c1429.us-east4-0.gcp.cloud.qdrant.io:6333"
-api_key = "K5BKjVGR8Qn4pVMk9nPFNTqITu3QVGR1O8qlDDH6kk52HUwB4lRjjw"
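With the committed secrets file deleted, the Qdrant credentials have to reach the process some other way at runtime. A minimal sketch of one common alternative, reading them from environment variables with the qdrant-client package (the variable names QDRANT_URL and QDRANT_API_KEY are illustrative, not something this repository defines):

    import os
    from qdrant_client import QdrantClient  # assumes qdrant-client is installed

    # Credentials are injected via the environment instead of a tracked file.
    client = QdrantClient(
        url=os.environ["QDRANT_URL"],
        api_key=os.environ["QDRANT_API_KEY"],
    )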
cognee.ipynb (337 changes)
File diff suppressed because one or more lines are too long
@@ -41,7 +41,7 @@ async def add(file_paths: Union[str, List[str]], dataset_name: str = None):
         if dataset_name is not None and not key.startswith(dataset_name):
             continue
 
-        results.append(add_dlt(datasets[key], dataset_name = key))
+        results.append(add(datasets[key], dataset_name = key))
 
     return await asyncio.gather(*results)
 
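The replacement call re-enters add for each matching dataset, and the resulting coroutines are only awaited together at the end. A self-contained sketch of that schedule-then-gather pattern (process, process_all, and the dataset names below are hypothetical, not code from this repository):

    import asyncio

    async def process(dataset_name: str) -> str:
        # stand-in for the per-dataset work done inside add()
        await asyncio.sleep(0)
        return f"loaded {dataset_name}"

    async def process_all(names: list[str]) -> list[str]:
        tasks = [process(name) for name in names]  # create coroutines; nothing runs yet
        return await asyncio.gather(*tasks)        # await them concurrently, results keep order

    print(asyncio.run(process_all(["events", "users"])))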
@@ -15,102 +15,6 @@ class OpenAIAdapter(LLMInterface):
         openai.api_key = api_key
         self.aclient = instructor.apatch(AsyncOpenAI())
         self.model = model
-    # OPENAI_API_KEY = config.openai_key
-
-    # @staticmethod
-    # def retry_with_exponential_backoff(
-    #     func,
-    #     initial_delay: float = 1,
-    #     exponential_base: float = 2,
-    #     jitter: bool = True,
-    #     max_retries: int = 20,
-    #     errors: tuple = (openai.RateLimitError,),
-    # ):
-    #     """Retry a function with exponential backoff."""
-
-    #     def wrapper(*args, **kwargs):
-    #         """Wrapper for sync functions."""
-    #         # Initialize variables
-    #         num_retries = 0
-    #         delay = initial_delay
-
-    #         # Loop until a successful response or max_retries is hit or an exception is raised
-    #         while True:
-    #             try:
-    #                 return func(*args, **kwargs)
-
-    #             # Retry on specified errors
-    #             except errors:
-    #                 # Increment retries
-    #                 num_retries += 1
-
-    #                 # Check if max retries has been reached
-    #                 if num_retries > max_retries:
-    #                     raise Exception(
-    #                         f"Maximum number of retries ({max_retries}) exceeded."
-    #                     )
-
-    #                 # Increment the delay
-    #                 delay *= exponential_base * (1 + jitter * random.random())
-
-    #                 # Sleep for the delay
-    #                 time.sleep(delay)
-
-    #             # Raise exceptions for any errors not specified
-    #             except Exception as e:
-    #                 raise e
-
-    #     return wrapper
-
-
-    # @staticmethod
-    # async def aretry_with_exponential_backoff(
-    #     func,
-    #     initial_delay: float = 1,
-    #     exponential_base: float = 2,
-    #     jitter: bool = True,
-    #     max_retries: int = 20,
-    #     errors: tuple = (openai.RateLimitError,),
-    # ):
-    #     """Retry a function with exponential backoff."""
-
-    #     async def wrapper(*args, **kwargs):
-    #         """Wrapper for async functions.
-    #         :param args: list
-    #         :param kwargs: dict"""
-    #         # Initialize variables
-    #         num_retries = 0
-    #         delay = initial_delay
-
-    #         # Loop until a successful response or max_retries is hit or an exception is raised
-    #         while True:
-    #             try:
-    #                 return await func(*args, **kwargs)
-
-    #             # Retry on specified errors
-    #             except errors as e:
-    #                 print(f"acreate (backoff): caught error: {e}")
-    #                 # Increment retries
-    #                 num_retries += 1
-
-    #                 # Check if max retries has been reached
-    #                 if num_retries > max_retries:
-    #                     raise Exception(
-    #                         f"Maximum number of retries ({max_retries}) exceeded."
-    #                     )
-
-    #                 # Increment the delay
-    #                 delay *= exponential_base * (1 + jitter * random.random())
-
-    #                 # Sleep for the delay
-    #                 await asyncio.sleep(delay)
-
-    #             # Raise exceptions for any errors not specified
-    #             except Exception as e:
-    #                 raise e
-
-    #     return wrapper
-
 
     @retry(stop = stop_after_attempt(5))
     def completions_with_backoff(self, **kwargs):
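The hand-rolled backoff wrappers deleted above duplicated what the tenacity decorator already provides on the methods that remain. A rough, standalone sketch of the same retry-with-exponential-backoff idea expressed with tenacity (flaky_call and its failure mode are hypothetical):

    import random
    from tenacity import retry, stop_after_attempt, wait_exponential

    # Retry up to 5 attempts, waiting exponentially longer between tries (capped at 60s),
    # which is roughly what the deleted commented-out wrappers did by hand.
    @retry(stop=stop_after_attempt(5), wait=wait_exponential(multiplier=1, max=60))
    def flaky_call() -> str:
        if random.random() < 0.5:  # stand-in for a rate-limit error from the API
            raise RuntimeError("rate limited")
        return "ok"

    print(flaky_call())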
@@ -127,11 +31,6 @@ class OpenAIAdapter(LLMInterface):
     async def acreate_embedding_with_backoff(self, input: List[str], model: str = "text-embedding-ada-002"):
         """Wrapper around Embedding.acreate w/ backoff"""
 
-        # client = openai.AsyncOpenAI(
-        #     # This is the default and can be omitted
-        #     api_key=os.environ.get("OPENAI_API_KEY"),
-        # )
-
         return await self.aclient.embeddings.create(input=input, model=model)
 
     async def async_get_embedding_with_backoff(self, text, model="text-embedding-ada-002"):
@@ -139,7 +38,6 @@ class OpenAIAdapter(LLMInterface):
         It specifies defaults + handles rate-limiting + is async"""
         text = text.replace("\n", " ")
         response = await self.aclient.embeddings.create(input =text, model= model)
-        # response = await self.acreate_embedding_with_backoff(input=text, model=model)
         embedding = response.data[0].embedding
         return embedding
 
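For context, the kept call path goes straight through the instructor-patched AsyncOpenAI client. A minimal standalone sketch of that embeddings call on the plain openai 1.x async client (it expects OPENAI_API_KEY in the environment):

    import asyncio
    from openai import AsyncOpenAI  # openai>=1.0; reads OPENAI_API_KEY from the environment

    async def main() -> None:
        client = AsyncOpenAI()
        response = await client.embeddings.create(
            input="hello world", model="text-embedding-ada-002"
        )
        print(len(response.data[0].embedding))  # 1536 dimensions for text-embedding-ada-002

    asyncio.run(main())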
@@ -162,7 +60,7 @@ class OpenAIAdapter(LLMInterface):
     async def async_get_batch_embeddings_with_backoff(self, texts: List[str], models: List[str]):
         """To get multiple text embeddings in parallel, import/call this function
         It specifies defaults + handles rate-limiting + is async"""
-        # Create a generator of coroutines
+        # Collect all coroutines
         coroutines = (self.async_get_embedding_with_backoff(text, model)
                       for text, model in zip(texts, models))
 
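The generator built here pairs each text with its own model name; unpacking it into asyncio.gather is what actually runs the requests concurrently. A small, self-contained illustration of that pairing (fake_embed and embed_batch are hypothetical stand-ins for the real embedding call):

    import asyncio

    async def fake_embed(text: str, model: str) -> str:
        await asyncio.sleep(0)  # placeholder for the network round-trip
        return f"{model}:{text}"

    async def embed_batch(texts: list[str], models: list[str]) -> list[str]:
        coroutines = (fake_embed(t, m) for t, m in zip(texts, models))
        return await asyncio.gather(*coroutines)  # unpack the generator into gather

    print(asyncio.run(embed_batch(["a", "b"], ["ada", "ada"])))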
@@ -6,11 +6,11 @@ from tenacity import retry, stop_after_attempt
 import openai
 
 HOST = os.getenv("OPENAI_API_BASE")
-HOST_TYPE = os.getenv("BACKEND_TYPE") # default None == ChatCompletion
 
 if HOST is not None:
     openai.api_base = HOST
 
+
 @retry(stop = stop_after_attempt(5))
 def completions_with_backoff(**kwargs):
     """Wrapper around ChatCompletion.create w/ backoff"""
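The kept lines configure the legacy module-level client (openai<1.0), where openai.api_base redirects every call globally. For comparison, a hedged sketch of the equivalent on the 1.x client, where the base URL is passed per client instance instead (the fallback URL shown is the library's public default, everything else is illustrative):

    import os
    from openai import OpenAI  # openai>=1.0

    client = OpenAI(
        base_url=os.getenv("OPENAI_API_BASE", "https://api.openai.com/v1"),
        api_key=os.environ["OPENAI_API_KEY"],
    )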
@@ -62,7 +62,6 @@ def get_embedding_with_backoff(text:str, model:str="text-embedding-ada-002"):
     return embedding
 
 
-
 async def async_get_batch_embeddings_with_backoff(texts: List[str], models: List[str]) :
     """To get multiple text embeddings in parallel, import/call this function
     It specifies defaults + handles rate-limiting + is async"""