This commit is contained in:
kavenGw 2025-10-28 11:08:19 +08:00 committed by GitHub
commit debb7bf330
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
7 changed files with 280 additions and 1 deletions

View file

@ -1,8 +1,11 @@
from .client import EmbedderClient
from .openai import OpenAIEmbedder, OpenAIEmbedderConfig
from .ollama import OllamaEmbedder, OllamaEmbedderConfig
# Public API of the embedder package: the abstract client interface plus
# the OpenAI and Ollama implementations and their configuration models.
__all__ = [
    'EmbedderClient',
    'OpenAIEmbedder',
    'OpenAIEmbedderConfig',
    'OllamaEmbedder',
    'OllamaEmbedderConfig',
]

View file

@ -0,0 +1,131 @@
"""
Copyright 2024, Zep Software, Inc.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""
import logging
from collections.abc import Iterable
from typing import Any
import httpx
from pydantic import Field
from .client import EmbedderClient, EmbedderConfig
# Module-level logger, named after this module per stdlib convention.
logger = logging.getLogger(__name__)
# Default embedding model to request from Ollama.
DEFAULT_EMBEDDING_MODEL = 'nomic-embed-text'
# Default address of a locally running Ollama server.
DEFAULT_BASE_URL = 'http://localhost:11434'
class OllamaEmbedderConfig(EmbedderConfig):
    """Configuration for the Ollama embedder: model name and server base URL."""

    # Embedding model to request from the Ollama server.
    embedding_model: str = DEFAULT_EMBEDDING_MODEL
    # Base URL of the Ollama HTTP API (no trailing path).
    base_url: str = DEFAULT_BASE_URL
class OllamaEmbedder(EmbedderClient):
    """
    Ollama Embedder Client.

    Uses Ollama's native ``/api/embed`` endpoint (not the OpenAI-compatible
    route) to generate embedding vectors.
    """

    def __init__(self, config: OllamaEmbedderConfig | None = None):
        """
        Args:
            config: Connection and model settings. Defaults to a local
                Ollama instance with the default embedding model.
        """
        if config is None:
            config = OllamaEmbedderConfig()
        self.config = config
        # Normalize the base URL so we never build '...//api/embed'.
        self.base_url = config.base_url.rstrip('/')
        self.embed_url = f'{self.base_url}/api/embed'

    @staticmethod
    def _to_text(
        input_data: str | list[str] | Iterable[int] | Iterable[Iterable[int]],
    ) -> str:
        """Coerce the supported input shapes into a single text string.

        NOTE: for list input only the FIRST element is embedded; callers
        needing one embedding per item should use ``create_batch``.
        """
        if isinstance(input_data, str):
            return input_data
        if isinstance(input_data, list) and input_data:
            first = input_data[0]
            return first if isinstance(first, str) else str(first)
        # Fallback for other iterables (token id sequences, etc.).
        return str(input_data)

    async def create(
        self, input_data: str | list[str] | Iterable[int] | Iterable[Iterable[int]]
    ) -> list[float]:
        """
        Create an embedding for the given input using Ollama's embedding model.

        Args:
            input_data: The input to embed. Strings are embedded directly;
                for lists only the first element is embedded (use
                ``create_batch`` for one-embedding-per-item semantics).

        Returns:
            The embedding vector, truncated to ``config.embedding_dim`` floats.

        Raises:
            Exception: If the Ollama API returns an error status or a
                response without usable embeddings.
        """
        payload = {
            'model': self.config.embedding_model,
            'input': self._to_text(input_data),
        }
        try:
            async with httpx.AsyncClient() as client:
                response = await client.post(
                    self.embed_url,
                    json=payload,
                    headers={'Content-Type': 'application/json'},
                    timeout=30.0,
                )
            # Raise httpx.HTTPStatusError for 4xx/5xx responses. The original
            # code checked status_code by hand and raised a bare Exception,
            # which made its HTTPStatusError handler unreachable.
            response.raise_for_status()
            result = response.json()
            if 'embeddings' not in result:
                raise Exception(f'No embeddings in response: {result}')
            embeddings = result['embeddings']
            if not embeddings:
                raise Exception('Empty embeddings returned')
            # Return the first embedding, truncated to the configured dimension.
            return embeddings[0][: self.config.embedding_dim]
        except httpx.HTTPStatusError as e:
            logger.error(
                'HTTP error creating Ollama embedding: %s - %s',
                e.response.status_code,
                e.response.text,
            )
            # Preserve the original error message format for callers, but
            # chain the cause instead of discarding it.
            raise Exception(
                f'Ollama API error {e.response.status_code}: {e.response.text}'
            ) from e
        except Exception as e:
            logger.error('Error creating Ollama embedding: %s', e)
            raise

    async def create_batch(self, input_data_list: list[str]) -> list[list[float]]:
        """
        Create embeddings for a batch of texts.

        Ollama's native endpoint is called once per text here, so the batch
        is processed sequentially.

        Raises:
            Exception: Propagated from ``create`` on the first failing text.
        """
        embeddings: list[list[float]] = []
        for text in input_data_list:
            try:
                embeddings.append(await self.create(text))
            except Exception as e:
                logger.error("Error creating embedding for text '%s...': %s", text[:50], e)
                raise
        return embeddings

View file

@ -23,6 +23,17 @@ MODEL_NAME=gpt-4.1-mini
# Optional: Only needed for non-standard OpenAI endpoints
# OPENAI_BASE_URL=https://api.openai.com/v1
# Embedder Configuration
# Provider is auto-detected based on configuration:
# - Azure: if AZURE_OPENAI_EMBEDDING_ENDPOINT is set
# - Ollama: if USE_OLLAMA_FOR_EMBEDDER is set to true
# - OpenAI: default (no additional config needed)
# USE_OLLAMA_FOR_EMBEDDER=true # Set this to true to use Ollama
# OLLAMA_EMBEDDER_API_KEY=ollama # Ollama API key (optional, defaults to 'ollama')
# OLLAMA_EMBEDDER_BASE_URL=http://localhost:11434 # Ollama base URL (when using Ollama)
# OLLAMA_EMBEDDER_MODEL_NAME=nomic-embed-text # Ollama embedding model to use
# OLLAMA_EMBEDDER_DIMENSION=768 # Ollama embedding dimension (model-specific)
# Optional: Group ID for namespacing graph data
# GROUP_ID=my_project

View file

@ -0,0 +1,45 @@
# Graphiti MCP Server Environment Configuration
# Neo4j Database Configuration
# These settings are used to connect to your Neo4j database
NEO4J_URI=bolt://localhost:7687
NEO4J_USER=neo4j
NEO4J_PASSWORD=demodemo
# Gemini API Configuration (via the OpenAI-compatible endpoint below)
# Required for LLM operations
OPENAI_API_KEY=your_gemini_api_key_here
MODEL_NAME=gemini-2.5-flash
SMALL_MODEL_NAME=gemini-2.5-flash
# Optional: Only needed for non-standard OpenAI endpoints
OPENAI_BASE_URL=https://generativelanguage.googleapis.com/v1beta
# Embedder Configuration
# Optional: Separate API key and URL for embedder (falls back to OPENAI_API_KEY and OPENAI_BASE_URL if not set)
# Note: this configuration uses Ollama as a free local alternative for embeddings
USE_OLLAMA_FOR_EMBEDDER=true
OLLAMA_EMBEDDER_API_KEY=ollama
OLLAMA_EMBEDDER_BASE_URL=http://localhost:11434
OLLAMA_EMBEDDER_MODEL_NAME=nomic-embed-text
OLLAMA_EMBEDDER_DIMENSION=768
# Optional: Group ID for namespacing graph data
# GROUP_ID=my_project
# Optional: Path configuration for Docker
# PATH=/root/.local/bin:${PATH}
# Optional: Memory settings for Neo4j (used in Docker Compose)
# NEO4J_server_memory_heap_initial__size=512m
# NEO4J_server_memory_heap_max__size=1G
# NEO4J_server_memory_pagecache_size=512m
# Azure OpenAI configuration
# Optional: Only needed for Azure OpenAI endpoints
# AZURE_OPENAI_ENDPOINT=your_azure_openai_endpoint_here
# AZURE_OPENAI_API_VERSION=2025-01-01-preview
# AZURE_OPENAI_DEPLOYMENT_NAME=gpt-4o-gpt-4o-mini-deployment
# AZURE_OPENAI_EMBEDDING_API_VERSION=2023-05-15
# AZURE_OPENAI_EMBEDDING_DEPLOYMENT_NAME=text-embedding-3-large-deployment
# AZURE_OPENAI_USE_MANAGED_IDENTITY=false

View file

@ -0,0 +1,44 @@
# Graphiti MCP Server Environment Configuration
# Neo4j Database Configuration
# These settings are used to connect to your Neo4j database
NEO4J_URI=bolt://localhost:7687
NEO4J_USER=neo4j
NEO4J_PASSWORD=demodemo
# OpenRouter API Configuration (OpenAI-compatible endpoint)
# Required for LLM operations
OPENAI_API_KEY=your_open_router_api_key_here
MODEL_NAME=gpt-4.1-mini
# Optional: Only needed for non-standard OpenAI endpoints
OPENAI_BASE_URL=https://openrouter.ai/api/v1
# Embedder Configuration
# Optional: Separate API key and URL for embedder (falls back to OPENAI_API_KEY and OPENAI_BASE_URL if not set)
# Note: OpenRouter does not support embeddings API, using Ollama as free alternative
USE_OLLAMA_FOR_EMBEDDER=true
OLLAMA_EMBEDDER_API_KEY=ollama
OLLAMA_EMBEDDER_BASE_URL=http://localhost:11434
OLLAMA_EMBEDDER_MODEL_NAME=nomic-embed-text
OLLAMA_EMBEDDER_DIMENSION=768
# Optional: Group ID for namespacing graph data
# GROUP_ID=my_project
# Optional: Path configuration for Docker
# PATH=/root/.local/bin:${PATH}
# Optional: Memory settings for Neo4j (used in Docker Compose)
# NEO4J_server_memory_heap_initial__size=512m
# NEO4J_server_memory_heap_max__size=1G
# NEO4J_server_memory_pagecache_size=512m
# Azure OpenAI configuration
# Optional: Only needed for Azure OpenAI endpoints
# AZURE_OPENAI_ENDPOINT=your_azure_openai_endpoint_here
# AZURE_OPENAI_API_VERSION=2025-01-01-preview
# AZURE_OPENAI_DEPLOYMENT_NAME=gpt-4o-gpt-4o-mini-deployment
# AZURE_OPENAI_EMBEDDING_API_VERSION=2023-05-15
# AZURE_OPENAI_EMBEDDING_DEPLOYMENT_NAME=text-embedding-3-large-deployment
# AZURE_OPENAI_USE_MANAGED_IDENTITY=false

View file

@ -102,6 +102,11 @@ The server supports both Neo4j and FalkorDB as database backends. Use the `DATAB
- `MODEL_NAME`: OpenAI model name to use for LLM operations.
- `SMALL_MODEL_NAME`: OpenAI model name to use for smaller LLM operations.
- `LLM_TEMPERATURE`: Temperature for LLM responses (0.0-2.0).
- `USE_OLLAMA_FOR_EMBEDDER`: Set to `true` to use Ollama for embeddings (auto-detects Ollama provider)
- `OLLAMA_EMBEDDER_API_KEY`: Ollama API key (optional, defaults to 'ollama')
- `OLLAMA_EMBEDDER_BASE_URL`: Ollama base URL for embedder API (when using Ollama)
- `OLLAMA_EMBEDDER_MODEL_NAME`: Ollama embedding model name
- `OLLAMA_EMBEDDER_DIMENSION`: Ollama embedding dimension
- `AZURE_OPENAI_ENDPOINT`: Optional Azure OpenAI LLM endpoint URL
- `AZURE_OPENAI_DEPLOYMENT_NAME`: Optional Azure OpenAI LLM deployment name
- `AZURE_OPENAI_API_VERSION`: Optional Azure OpenAI LLM API version

View file

@ -25,6 +25,7 @@ from graphiti_core.edges import EntityEdge
from graphiti_core.embedder.azure_openai import AzureOpenAIEmbedderClient
from graphiti_core.embedder.client import EmbedderClient
from graphiti_core.embedder.openai import OpenAIEmbedder, OpenAIEmbedderConfig
from graphiti_core.embedder.ollama import OllamaEmbedder, OllamaEmbedderConfig
from graphiti_core.llm_client import LLMClient
from graphiti_core.llm_client.azure_openai_client import AzureOpenAILLMClient
from graphiti_core.llm_client.config import LLMConfig
@ -360,6 +361,7 @@ class GraphitiEmbedderConfig(BaseModel):
azure_openai_deployment_name: str | None = None
azure_openai_api_version: str | None = None
azure_openai_use_managed_identity: bool = False
use_ollama_for_embedder: bool = False
@classmethod
def from_env(cls) -> 'GraphitiEmbedderConfig':
@ -369,6 +371,13 @@ class GraphitiEmbedderConfig(BaseModel):
model_env = os.environ.get('EMBEDDER_MODEL_NAME', '')
model = model_env if model_env.strip() else DEFAULT_EMBEDDER_MODEL
# Get embedder-specific API key and base URL, fallback to general OpenAI settings
# Detect provider based on configuration (similar to Azure pattern)
use_ollama_for_embedder = (
os.environ.get('USE_OLLAMA_FOR_EMBEDDER', 'false').lower() == 'true'
)
azure_openai_endpoint = os.environ.get('AZURE_OPENAI_EMBEDDING_ENDPOINT', None)
azure_openai_api_version = os.environ.get('AZURE_OPENAI_EMBEDDING_API_VERSION', None)
azure_openai_deployment_name = os.environ.get(
@ -405,11 +414,19 @@ class GraphitiEmbedderConfig(BaseModel):
api_key=api_key,
azure_openai_api_version=azure_openai_api_version,
azure_openai_deployment_name=azure_openai_deployment_name,
use_ollama_for_embedder=False,
)
else:
if use_ollama_for_embedder:
api_key_env = os.environ.get("OLLAMA_EMBEDDER_API_KEY")
api_key = api_key_env if api_key_env else 'ollama'
logger.info(f'ollama api_key: {api_key}')
else:
api_key = os.environ.get("OPENAI_API_KEY")
return cls(
model=model,
api_key=os.environ.get('OPENAI_API_KEY'),
api_key=api_key,
use_ollama_for_embedder=use_ollama_for_embedder,
)
def create_client(self) -> EmbedderClient | None:
@ -441,6 +458,29 @@ class GraphitiEmbedderConfig(BaseModel):
else:
logger.error('OPENAI_API_KEY must be set when using Azure OpenAI API')
return None
elif self.use_ollama_for_embedder:
base_url_env = os.environ.get('OLLAMA_EMBEDDER_BASE_URL')
base_url = base_url_env if base_url_env else 'http://localhost:11434'
model_env = os.environ.get('OLLAMA_EMBEDDER_MODEL_NAME')
model = model_env if model_env else 'nomic-embed-text'
# Get embedding dimension from environment
embedding_dim_env = os.environ.get('OLLAMA_EMBEDDER_DIMENSION')
embedding_dim = int(embedding_dim_env) if embedding_dim_env else 768
logger.info(f'ollama model: {model}')
logger.info(f'ollama base_url: {base_url}')
logger.info(f'ollama embedding_dim: {embedding_dim}')
# Ollama API setup
ollama_config = OllamaEmbedderConfig(
embedding_model=model,
base_url=base_url,
embedding_dim=embedding_dim # nomic-embed-text default
)
return OllamaEmbedder(config=ollama_config)
else:
# OpenAI API setup
if not self.api_key: