Added Mistral support as LLM provider using litellm

parent a4ab65768b
commit 617c1f0d71

7 changed files with 163 additions and 3 deletions
@@ -170,7 +170,7 @@ async def add(
     - LLM_API_KEY: API key for your LLM provider (OpenAI, Anthropic, etc.)

     Optional:
-    - LLM_PROVIDER: "openai" (default), "anthropic", "gemini", "ollama"
+    - LLM_PROVIDER: "openai" (default), "anthropic", "gemini", "ollama", "mistral"
     - LLM_MODEL: Model name (default: "gpt-5-mini")
     - DEFAULT_USER_EMAIL: Custom default user email
     - DEFAULT_USER_PASSWORD: Custom default user password
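A minimal configuration sketch, assuming these environment variables are read at startup as the docstring above describes; the model value is one of the options added further down and the key is a placeholder:

import os

# Provider selection via the documented environment variables.
os.environ["LLM_PROVIDER"] = "mistral"
os.environ["LLM_MODEL"] = "mistral-large-2411"        # example model from get_settings()
os.environ["LLM_API_KEY"] = "<your-mistral-api-key>"  # placeholder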
@@ -21,7 +21,13 @@ class SettingsDTO(OutDTO):


 class LLMConfigInputDTO(InDTO):
-    provider: Union[Literal["openai"], Literal["ollama"], Literal["anthropic"], Literal["gemini"]]
+    provider: Union[
+        Literal["openai"],
+        Literal["ollama"],
+        Literal["anthropic"],
+        Literal["gemini"],
+        Literal["mistral"],
+    ]
     model: str
     api_key: str

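With "mistral" added to the Literal union, a settings payload like the following now validates against this DTO; the field names come from the class above, and the concrete values are placeholders:

# Hedged sketch: the shape LLMConfigInputDTO accepts after this change.
llm_config_payload = {
    "provider": "mistral",                # newly permitted by the Literal union
    "model": "mistral-medium-2508",       # one of the model values added in get_settings()
    "api_key": "<your-mistral-api-key>",  # placeholder
}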
@@ -23,6 +23,7 @@ class LLMProvider(Enum):
     - ANTHROPIC: Represents the Anthropic provider.
     - CUSTOM: Represents a custom provider option.
     - GEMINI: Represents the Gemini provider.
+    - MISTRAL: Represents the Mistral AI provider.
     """

     OPENAI = "openai"
@@ -30,6 +31,7 @@ class LLMProvider(Enum):
     ANTHROPIC = "anthropic"
     CUSTOM = "custom"
     GEMINI = "gemini"
+    MISTRAL = "mistral"


 def get_llm_client(raise_api_key_error: bool = True):
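Because each member's value is the lowercase provider string, a configured "mistral" provider string maps directly onto the new member. A minimal check, with the import path assumed (in this diff the enum sits in the same module as get_llm_client):

# Assumed import path; only the member/value pair comes from the hunk above.
from cognee.infrastructure.llm.get_llm_client import LLMProvider

assert LLMProvider("mistral") is LLMProvider.MISTRAL
assert LLMProvider.MISTRAL.value == "mistral"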
@@ -145,5 +147,20 @@ def get_llm_client(raise_api_key_error: bool = True):
             api_version=llm_config.llm_api_version,
         )

+    elif provider == LLMProvider.MISTRAL:
+        if llm_config.llm_api_key is None:
+            raise LLMAPIKeyNotSetError()
+
+        from cognee.infrastructure.llm.structured_output_framework.litellm_instructor.llm.mistral.adapter import (
+            MistralAdapter,
+        )
+
+        return MistralAdapter(
+            api_key=llm_config.llm_api_key,
+            model=llm_config.llm_model,
+            max_completion_tokens=max_completion_tokens,
+            endpoint=llm_config.llm_endpoint,
+        )
+
     else:
         raise UnsupportedLLMProviderError(provider)
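A dispatch sketch, assuming the environment is configured as in the earlier example and that get_llm_client is importable from the module containing the LLMProvider enum (path assumed):

# Hedged sketch: with LLM_PROVIDER=mistral and an API key set, the branch
# added above returns a MistralAdapter instance.
from cognee.infrastructure.llm.get_llm_client import get_llm_client  # assumed path

client = get_llm_client()
print(type(client).__name__)  # expected: "MistralAdapter"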
@@ -0,0 +1,113 @@
+import litellm
+import instructor
+from pydantic import BaseModel
+from typing import Type, Optional
+from litellm import acompletion, JSONSchemaValidationError
+
+from cognee.shared.logging_utils import get_logger
+from cognee.modules.observability.get_observe import get_observe
+from cognee.infrastructure.llm.exceptions import MissingSystemPromptPathError
+from cognee.infrastructure.llm.structured_output_framework.litellm_instructor.llm.llm_interface import (
+    LLMInterface,
+)
+from cognee.infrastructure.llm.LLMGateway import LLMGateway
+from cognee.infrastructure.llm.config import get_llm_config
+from cognee.infrastructure.llm.structured_output_framework.litellm_instructor.llm.rate_limiter import (
+    rate_limit_async,
+    sleep_and_retry_async,
+)
+
+logger = get_logger()
+observe = get_observe()
+
+
+class MistralAdapter(LLMInterface):
+    """
+    Adapter for Mistral AI API, for structured output generation and prompt display.
+
+    Public methods:
+    - acreate_structured_output
+    - show_prompt
+    """
+
+    name = "Mistral"
+    model: str
+    api_key: str
+    max_completion_tokens: int
+
+    def __init__(self, api_key: str, model: str, max_completion_tokens: int, endpoint: str = None):
+        from mistralai import Mistral
+
+        self.model = model
+        self.max_completion_tokens = max_completion_tokens
+
+        self.aclient = instructor.from_litellm(
+            litellm.acompletion,
+            mode=instructor.Mode.MISTRAL_TOOLS,
+            api_key=get_llm_config().llm_api_key,
+        )
+
+    @sleep_and_retry_async()
+    @rate_limit_async
+    async def acreate_structured_output(
+        self, text_input: str, system_prompt: str, response_model: Type[BaseModel]
+    ) -> BaseModel:
+        """
+        Generate a response from the user query.
+
+        Parameters:
+        -----------
+            - text_input (str): The input text from the user to be processed.
+            - system_prompt (str): A prompt that sets the context for the query.
+            - response_model (Type[BaseModel]): The model to structure the response according to
+              its format.
+
+        Returns:
+        --------
+            - BaseModel: An instance of BaseModel containing the structured response.
+        """
+        return await self.aclient.chat.completions.create(
+            model=self.model,
+            max_tokens=self.max_completion_tokens,
+            max_retries=5,
+            messages=[
+                {
+                    "role": "system",
+                    "content": system_prompt,
+                },
+                {
+                    "role": "user",
+                    "content": f"""Use the given format to extract information
+                    from the following input: {text_input}""",
+                },
+            ],
+            response_model=response_model,
+        )
+
+    def show_prompt(self, text_input: str, system_prompt: str) -> str:
+        """
+        Format and display the prompt for a user query.
+
+        Parameters:
+        -----------
+            - text_input (str): Input text from the user to be included in the prompt.
+            - system_prompt (str): The system prompt that will be shown alongside the user input.
+
+        Returns:
+        --------
+            - str: The formatted prompt string combining system prompt and user input.
+        """
+        if not text_input:
+            text_input = "No user input provided."
+        if not system_prompt:
+            raise MissingSystemPromptPathError()
+
+        system_prompt = LLMGateway.read_query_prompt(system_prompt)
+
+        formatted_prompt = (
+            f"""System Prompt:\n{system_prompt}\n\nUser Input:\n{text_input}\n"""
+            if system_prompt
+            else None
+        )
+
+        return formatted_prompt
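A usage sketch for the new adapter, under stated assumptions: PersonInfo is an illustrative response model, the model name and token limit are placeholders, and (as the constructor above shows) the underlying instructor client reads the API key from get_llm_config(), so LLM_API_KEY still needs to be set in the environment.

import asyncio
import os

from pydantic import BaseModel

# The adapter module path is the one imported in get_llm_client above.
from cognee.infrastructure.llm.structured_output_framework.litellm_instructor.llm.mistral.adapter import (
    MistralAdapter,
)


class PersonInfo(BaseModel):
    # Illustrative response model, not part of the commit.
    name: str
    occupation: str


async def main():
    # Placeholder key; the adapter wires litellm to get_llm_config().llm_api_key.
    os.environ["LLM_API_KEY"] = "<your-mistral-api-key>"

    adapter = MistralAdapter(
        api_key=os.environ["LLM_API_KEY"],
        model="mistral-large-2411",  # one of the model values added in get_settings()
        max_completion_tokens=4096,
    )
    person = await adapter.acreate_structured_output(
        text_input="Ada Lovelace was an English mathematician.",
        system_prompt="Extract the person described in the input text.",
        response_model=PersonInfo,
    )
    print(person)


asyncio.run(main())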
@@ -15,6 +15,7 @@ class ModelName(Enum):
     ollama = "ollama"
     anthropic = "anthropic"
     gemini = "gemini"
+    mistral = "mistral"


 class LLMConfig(BaseModel):
@@ -72,6 +73,10 @@ def get_settings() -> SettingsDict:
             "value": "gemini",
             "label": "Gemini",
         },
+        {
+            "value": "mistral",
+            "label": "Mistral",
+        },
     ]

     return SettingsDict.model_validate(
@@ -134,6 +139,24 @@ def get_settings() -> SettingsDict:
                     "label": "Gemini 2.0 Flash",
                 },
             ],
+            "mistral": [
+                {
+                    "value": "mistral-medium-2508",
+                    "label": "Mistral Medium 3.1",
+                },
+                {
+                    "value": "magistral-medium-2509",
+                    "label": "Magistral Medium 1.2",
+                },
+                {
+                    "value": "magistral-medium-2507",
+                    "label": "Magistral Medium 1.1",
+                },
+                {
+                    "value": "mistral-large-2411",
+                    "label": "Mistral Large 2.1",
+                },
+            ],
         },
     },
     vector_db={
@@ -54,7 +54,8 @@ dependencies = [
     "networkx>=3.4.2,<4",
     "uvicorn>=0.34.0,<1.0.0",
     "gunicorn>=20.1.0,<24",
-    "websockets>=15.0.1,<16.0.0"
+    "websockets>=15.0.1,<16.0.0",
+    "mistralai>=1.9.10",
 ]

 [project.optional-dependencies]
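A quick post-install check, assuming the package is installed with this updated dependency list; importlib.metadata is standard library.

# Hedged sketch: confirms the newly declared mistralai dependency resolved.
from importlib.metadata import version

print(version("mistralai"))  # expected to satisfy >=1.9.10 per the constraint above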