Added docs

parent d903eacdc7
commit a86978fb15

6 changed files with 858 additions and 297 deletions

@@ -43,6 +43,10 @@ class Config:
    graph_filename = os.getenv("GRAPH_NAME", "cognee_graph.pkl")

    # Model parameters
    llm_provider: str = "ollama"
    ollama_endpoint: str = "http://localhost:11434/v1"
    ollama_key: Optional[str] = os.getenv("OLLAMA_API_KEY")
    ollama_model: str = "gpt-3.5-turbo"
    model: str = "gpt-4-0125-preview"
    # model: str = "gpt-3.5-turbo"
    model_endpoint: str = "openai"

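The new attributes make the model provider switchable at runtime while keeping the existing OpenAI defaults. A minimal sketch of overriding them in code before any client is built (attribute names come from the diff above; the local model name is only an illustration):

from cognee.config import Config

config = Config()
config.load()

# Point the pipeline at a local Ollama server instead of OpenAI.
config.llm_provider = "ollama"
config.ollama_endpoint = "http://localhost:11434/v1"  # Ollama's OpenAI-compatible route
config.ollama_model = "llama2"  # hypothetical model pulled into Ollama
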
@@ -1,6 +1,8 @@
from cognee.config import Config
from .databases.relational import SqliteEngine, DatabaseEngine
from .databases.vector import WeaviateAdapter, VectorDBInterface
from .llm.llm_interface import LLMInterface
from .llm.openai.adapter import OpenAIAdapter

config = Config()
config.load()

@@ -8,11 +10,15 @@ config.load()
class InfrastructureConfig():
    database_engine: DatabaseEngine = None
    vector_engine: VectorDBInterface = None
    llm_engine: LLMInterface = None

    def get_config(self) -> dict:
        if self.database_engine is None:
            self.database_engine = SqliteEngine(config.db_path, config.db_name)

        if self.llm_engine is None:
            self.llm_engine = OpenAIAdapter(config.openai_key, config.model)

        if self.vector_engine is None:
            self.vector_engine = WeaviateAdapter(
                config.weaviate_url,

@@ -28,5 +34,6 @@ class InfrastructureConfig():
    def set_config(self, new_config: dict):
        self.database_engine = new_config["database_engine"]
        self.vector_engine = new_config["vector_engine"]
        self.llm_engine = new_config["llm_engine"]

infrastructure_config = InfrastructureConfig()

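get_config lazily builds whichever engines are still None, and set_config swaps in all three at once. A rough usage sketch, assuming the singleton is importable as shown (import paths are inferred from the relative imports above) and that get_config returns the same three keys set_config reads:

from cognee.config import Config
from cognee.infrastructure import infrastructure_config  # import path assumed
from cognee.infrastructure.llm.openai.adapter import OpenAIAdapter  # path assumed

config = Config()
config.load()

current = infrastructure_config.get_config()  # assumed to return the same three keys

# Replace only the LLM engine; keep the lazily created database and vector engines.
infrastructure_config.set_config({
    "database_engine": current["database_engine"],
    "vector_engine": current["vector_engine"],
    "llm_engine": OpenAIAdapter(config.openai_key, config.model),
})
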
@@ -1,10 +1,27 @@
"""Get the LLM client."""
from enum import Enum
from cognee.config import Config
from .openai.adapter import OpenAIAdapter
from .ollama.adapter import OllamaAPIAdapter

# Define an Enum for LLM Providers
class LLMProvider(Enum):
    OPENAI = "openai"
    OLLAMA = "ollama"

config = Config()
config.load()

def get_llm_client():
    """Get the LLM client."""
    return OpenAIAdapter(config.openai_key, config.model)
    """Get the LLM client based on the configuration using Enums."""
    provider = LLMProvider(config.llm_provider)

    if provider == LLMProvider.OPENAI:
        return OpenAIAdapter(config.openai_key, config.model)
    elif provider == LLMProvider.OLLAMA:
        return OllamaAPIAdapter(config.ollama_endpoint, config.ollama_key, config.ollama_model)
    else:
        raise ValueError(f"Unsupported LLM provider: {provider}")

# Usage example
llm_client = get_llm_client()

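The provider is resolved from the configured string before any branch runs, so an unknown value fails as soon as the enum is constructed. A quick sketch of the selection behaviour (values taken from the enum above):

LLMProvider("openai")   # LLMProvider.OPENAI -> OpenAIAdapter(config.openai_key, config.model)
LLMProvider("ollama")   # LLMProvider.OLLAMA -> OllamaAPIAdapter(endpoint, key, model)
LLMProvider("other")    # raises ValueError: 'other' is not a valid LLMProvider
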
cognee/infrastructure/llm/ollama/adapter.py (new file, 108 lines)

@@ -0,0 +1,108 @@
import asyncio

import aiohttp
from typing import List, Type
from pydantic import BaseModel
import instructor
from tenacity import retry, stop_after_attempt
from openai import AsyncOpenAI

import openai
from cognee.infrastructure.llm.llm_interface import LLMInterface
from cognee.infrastructure.llm.prompts import read_query_prompt


class OllamaAPIAdapter(LLMInterface):
    """Adapter for Ollama's API"""

    def __init__(self, ollama_endpoint, api_key: str, model: str):

        self.aclient = instructor.patch(
            AsyncOpenAI(
                base_url=ollama_endpoint,
                api_key=api_key,  # required, but unused
            ),
            mode=instructor.Mode.JSON,
        )
        self.model = model

    @retry(stop=stop_after_attempt(5))
    def completions_with_backoff(self, **kwargs):
        """Wrapper around ChatCompletion.create w/ backoff"""
        # Local model
        return openai.chat.completions.create(**kwargs)

    @retry(stop=stop_after_attempt(5))
    async def acompletions_with_backoff(self, **kwargs):
        """Wrapper around ChatCompletion.acreate w/ backoff"""
        return await openai.chat.completions.acreate(**kwargs)

    @retry(stop=stop_after_attempt(5))
    async def acreate_embedding_with_backoff(self, input: List[str], model: str = "text-embedding-3-large"):
        """Wrapper around Embedding.acreate w/ backoff"""

        return await self.aclient.embeddings.create(input=input, model=model)

    async def async_get_embedding_with_backoff(self, text, model="text-embedding-3-large"):
        """To get text embeddings, import/call this function
        It specifies defaults + handles rate-limiting + is async"""
        text = text.replace("\n", " ")
        response = await self.aclient.embeddings.create(input=text, model=model)
        embedding = response.data[0].embedding
        return embedding

    @retry(stop=stop_after_attempt(5))
    def create_embedding_with_backoff(self, **kwargs):
        """Wrapper around Embedding.create w/ backoff"""
        return openai.embeddings.create(**kwargs)

    def get_embedding_with_backoff(self, text: str, model: str = "text-embedding-3-large"):
        """To get text embeddings, import/call this function
        It specifies defaults + handles rate-limiting
        :param text: str
        :param model: str
        """
        text = text.replace("\n", " ")
        response = self.create_embedding_with_backoff(input=[text], model=model)
        embedding = response.data[0].embedding
        return embedding

    async def async_get_batch_embeddings_with_backoff(self, texts: List[str], models: List[str]):
        """To get multiple text embeddings in parallel, import/call this function
        It specifies defaults + handles rate-limiting + is async"""
        # Collect all coroutines
        coroutines = (self.async_get_embedding_with_backoff(text, model)
                      for text, model in zip(texts, models))

        # Run the coroutines in parallel and gather the results
        embeddings = await asyncio.gather(*coroutines)

        return embeddings

    @retry(stop=stop_after_attempt(5))
    async def acreate_structured_output(self, text_input: str, system_prompt: str,
                                        response_model: Type[BaseModel]) -> BaseModel:
        """Generate a response from a user query."""
        return await self.aclient.chat.completions.create(
            model=self.model,
            messages=[
                {
                    "role": "user",
                    "content": f"""Use the given format to
                    extract information from the following input: {text_input}. """,
                },
                {"role": "system", "content": system_prompt},
            ],
            response_model=response_model,
        )

    def show_prompt(self, text_input: str, system_prompt: str) -> str:
        """Format and display the prompt for a user query."""
        if not text_input:
            text_input = "No user input provided."
        if not system_prompt:
            raise ValueError("No system prompt path provided.")
        system_prompt = read_query_prompt(system_prompt)

        formatted_prompt = f"""System Prompt:\n{system_prompt}\n\nUser Input:\n{text_input}\n""" if system_prompt else None
        return formatted_prompt

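A rough end-to-end sketch of exercising the new adapter through get_llm_client, assuming config.llm_provider is "ollama", an Ollama server is listening on the configured endpoint, and the served model can emit JSON; the Summary schema, prompt strings and import path are illustrative only:

import asyncio
from typing import List
from pydantic import BaseModel

from cognee.infrastructure.llm import get_llm_client  # import path assumed


class Summary(BaseModel):
    # Illustrative response schema for structured output.
    title: str
    key_points: List[str]


async def main():
    client = get_llm_client()  # OllamaAPIAdapter when llm_provider == "ollama"
    summary = await client.acreate_structured_output(
        text_input="Cognee builds knowledge graphs from documents.",
        system_prompt="Summarise the input as structured data.",
        response_model=Summary,
    )
    print(summary)

asyncio.run(main())
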
poetry.lock (generated, 1008 lines changed)
File diff suppressed because it is too large

@@ -18,7 +18,7 @@ classifiers = [

[tool.poetry.dependencies]
python = "~3.10"
openai = "1.12.0"
openai = "1.14.3"
python-dotenv = "1.0.1"
fastapi = "^0.109.2"
uvicorn = "0.22.0"

@@ -26,7 +26,7 @@ boto3 = "^1.26.125"
gunicorn = "^20.1.0"
sqlalchemy = "^2.0.21"
asyncpg = "^0.28.0"
instructor = "^0.3.4"
instructor = "^0.6.6"
networkx = "^3.2.1"
graphviz = "^0.20.1"
langdetect = "^1.0.9"

@@ -46,11 +46,9 @@ dlt = "^0.4.6"
duckdb = {version = "^0.10.0", extras = ["dlt"]}
overrides = "^7.7.0"
aiofiles = "^23.2.1"
qdrant-client = "^1.8.0"
duckdb-engine = "^0.11.2"
graphistry = "^0.33.5"
tenacity = "^8.2.3"
weaviate-client = "^4.5.4"

[tool.poetry.extras]
dbt = ["dbt-core", "dbt-redshift", "dbt-bigquery", "dbt-duckdb", "dbt-snowflake", "dbt-athena-community", "dbt-databricks"]

@@ -61,6 +59,7 @@ postgres = ["psycopg2-binary", "psycopg2cffi"]
redshift = ["psycopg2-binary", "psycopg2cffi"]
parquet = ["pyarrow"]
duckdb = ["duckdb"]
qdrant = ["qdrant-client"]
filesystem = ["s3fs", "botocore"]
s3 = ["s3fs", "botocore"]
gs = ["gcsfs"]

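A small sanity-check sketch after reinstalling dependencies, confirming the bumped libraries expose what the new adapter relies on (expected version taken from the diff above):

import instructor
import openai
from openai import AsyncOpenAI

print(openai.__version__)    # expected: 1.14.3
print(instructor.Mode.JSON)  # JSON mode used by instructor.patch(...) in the adapter
AsyncOpenAI(base_url="http://localhost:11434/v1", api_key="unused")  # client construction only
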