From 5cf14eb7fc2d89bbecf70d6f48048e8cf0a1009a Mon Sep 17 00:00:00 2001
From: Vasilije <8619304+Vasilije1990@users.noreply.github.com>
Date: Fri, 16 May 2025 17:54:12 +0200
Subject: [PATCH] fix: Mcp small updates (#831)

<!-- .github/pull_request_template.md -->

## Description
<!-- Provide a clear description of the changes in this PR -->

## DCO Affirmation
I affirm that all code in every commit of this pull request conforms to
the terms of the Topoteretes Developer Certificate of Origin.

---------

Co-authored-by: Igor Ilic <igorilic03@gmail.com>
---
 cognee-mcp/pyproject.toml |   2 +-
 cognee-mcp/src/server.py  | 173 ++++++++++++++++++++++++++++++++++++--
 2 files changed, 167 insertions(+), 8 deletions(-)
diff --git a/cognee-mcp/pyproject.toml b/cognee-mcp/pyproject.toml
index a2190dfda..e1bc56153 100644
--- a/cognee-mcp/pyproject.toml
+++ b/cognee-mcp/pyproject.toml
@@ -8,7 +8,7 @@ requires-python = ">=3.10"
 dependencies = [
     # For local cognee repo usage remove comment bellow and add absolute path to cognee
     #"cognee[postgres,codegraph,gemini,huggingface] @ file:/Users/<username>/Desktop/cognee",
-    "cognee[postgres,codegraph,gemini,huggingface]==0.1.40",
+    "cognee[postgres,codegraph,gemini,huggingface,docs]==0.1.40",
     "fastmcp>=1.0",
     "mcp==1.5.0",
     "uv>=0.6.3",
diff --git a/cognee-mcp/src/server.py b/cognee-mcp/src/server.py
index f8c65bc7c..6a0ff41d0 100755
--- a/cognee-mcp/src/server.py
+++ b/cognee-mcp/src/server.py
@@ -24,9 +24,46 @@ log_file = get_log_file_location()
 
 
 @mcp.tool()
-async def cognify(text: str, graph_model_file: str = None, graph_model_name: str = None) -> list:
+async def cognify(data: str, graph_model_file: str = None, graph_model_name: str = None) -> list:
+    """
+    Transform data into a structured knowledge graph in Cognee's memory layer.
+
+    This function launches a background task that processes the provided text/file location and
+    generates a knowledge graph representation. The function returns immediately while
+    the processing continues in the background due to MCP timeout constraints.
+
+    Parameters
+    ----------
+    data : str
+        The data to be processed and transformed into structured knowledge.
+        This can include natural language, file location, or any text-based information
+        that should become part of the agent's memory.
+
+    graph_model_file : str, optional
+        Path to a custom schema file that defines the structure of the generated knowledge graph.
+        If provided, this file will be loaded using importlib to create a custom graph model.
+        Default is None, which uses Cognee's built-in KnowledgeGraph model.
+
+    graph_model_name : str, optional
+        Name of the class within the graph_model_file to instantiate as the graph model.
+        Required if graph_model_file is specified.
+        Default is None, which uses the default KnowledgeGraph class.
+
+    Returns
+    -------
+    list
+        A list containing a single TextContent object with information about the
+        background task launch and how to check its status.
+
+    Notes
+    -----
+    - The function launches a background task and returns immediately
+    - The actual cognify process may take significant time depending on text length
+    - Use the cognify_status tool to check the progress of the operation
+    """
+
     async def cognify_task(
-        text: str, graph_model_file: str = None, graph_model_name: str = None
+        data: str, graph_model_file: str = None, graph_model_name: str = None
     ) -> str:
         """Build knowledge graph from the input text"""
         # NOTE: MCP uses stdout to communicate, we must redirect all output
@@ -38,7 +75,7 @@ async def cognify(text: str, graph_model_file: str = None, graph_model_name: str
             else:
                 graph_model = KnowledgeGraph
 
-            await cognee.add(text)
+            await cognee.add(data)
 
             try:
                 await cognee.cognify(graph_model=graph_model)
@@ -49,7 +86,7 @@ async def cognify(text: str, graph_model_file: str = None, graph_model_name: str
 
     asyncio.create_task(
         cognify_task(
-            text=text,
+            data=data,
             graph_model_file=graph_model_file,
             graph_model_name=graph_model_name,
         )
@@ -71,6 +108,35 @@ async def cognify(text: str, graph_model_file: str = None, graph_model_name: str
 
 @mcp.tool()
 async def codify(repo_path: str) -> list:
+    """
+    Analyze and generate a code-specific knowledge graph from a software repository.
+
+    This function launches a background task that processes the provided repository
+    and builds a code knowledge graph. The function returns immediately while
+    the processing continues in the background due to MCP timeout constraints.
+
+    Parameters
+    ----------
+    repo_path : str
+        Path to the code repository to analyze. This can be a local file path or a
+        relative path to a repository. The path should point to the root of the
+        repository or a specific directory within it.
+
+    Returns
+    -------
+    list
+        A list containing a single TextContent object with information about the
+        background task launch and how to check its status.
+
+    Notes
+    -----
+    - The function launches a background task and returns immediately
+    - The code graph generation may take significant time for larger repositories
+    - Use the codify_status tool to check the progress of the operation
+    - Process results are logged to the standard Cognee log file
+    - All stdout is redirected to stderr to maintain MCP communication integrity
+    """
+
     async def codify_task(repo_path: str):
         # NOTE: MCP uses stdout to communicate, we must redirect all output
         #       going to stdout ( like the print function ) to stderr.
@@ -103,6 +169,46 @@ async def codify(repo_path: str) -> list:
 
 @mcp.tool()
 async def search(search_query: str, search_type: str) -> list:
+    """
+    Search the Cognee knowledge graph for information relevant to the query.
+
+    This function executes a search against the Cognee knowledge graph using the
+    specified query and search type. It returns formatted results based on the
+    search type selected.
+
+    Parameters
+    ----------
+    search_query : str
+        The search query in natural language. This can be a question, instruction, or
+        any text that expresses what information is needed from the knowledge graph.
+
+    search_type : str
+        The type of search to perform. Valid options include:
+        - "GRAPH_COMPLETION": Returns an LLM response based on the search query and Cognee's memory
+        - "RAG_COMPLETION": Returns an LLM response based on the search query and standard RAG data
+        - "CODE": Returns code-related knowledge in JSON format
+        - "CHUNKS": Returns raw text chunks from the knowledge graph
+        - "INSIGHTS": Returns relationships between nodes in readable format
+
+        The search_type is case-insensitive and will be converted to uppercase.
+
+    Returns
+    -------
+    list
+        A list containing a single TextContent object with the search results.
+        The format of the result depends on the search_type:
+        - For CODE: JSON-formatted search results
+        - For GRAPH_COMPLETION/RAG_COMPLETION: A single text completion
+        - For CHUNKS: String representation of the raw chunks
+        - For INSIGHTS: Formatted string showing node relationships
+        - For other types: String representation of the search results
+
+    Notes
+    -----
+    - Different search types produce different output formats
+    - The function handles the conversion between Cognee's internal result format and MCP's output format
+    """
+
     async def search_task(search_query: str, search_type: str) -> str:
         """Search the knowledge graph"""
         # NOTE: MCP uses stdout to communicate, we must redirect all output
@@ -132,7 +238,24 @@ async def search(search_query: str, search_type: str) -> list:
 
 @mcp.tool()
 async def prune():
-    """Reset the knowledge graph"""
+    """
+    Reset the Cognee knowledge graph by removing all stored information.
+
+    This function performs a complete reset of both the data layer and system layer
+    of the Cognee knowledge graph, removing all nodes, edges, and associated metadata.
+    It is typically used during development or when needing to start fresh with a new
+    knowledge base.
+
+    Returns
+    -------
+    list
+        A list containing a single TextContent object with confirmation of the prune operation.
+
+    Notes
+    -----
+    - This operation cannot be undone. All memory data will be permanently deleted.
+    - The function prunes both data content (using prune_data) and system metadata (using prune_system)
+    """
     with redirect_stdout(sys.stderr):
         await cognee.prune.prune_data()
         await cognee.prune.prune_system(metadata=True)
@@ -141,7 +264,25 @@ async def prune():
 
 @mcp.tool()
 async def cognify_status():
-    """Get status of cognify pipeline"""
+    """
+    Get the current status of the cognify pipeline.
+
+    This function retrieves information about current and recently completed cognify operations
+    in the main_dataset. It provides details on progress, success/failure status, and statistics
+    about the processed data.
+
+    Returns
+    -------
+    list
+        A list containing a single TextContent object with the status information as a string.
+        The status includes information about active and completed jobs for the cognify_pipeline.
+
+    Notes
+    -----
+    - The function retrieves pipeline status specifically for the "cognify_pipeline" on the "main_dataset"
+    - Status information includes job progress, execution time, and completion status
+    - The status is returned in string format for easy reading
+    """
     with redirect_stdout(sys.stderr):
         user = await get_default_user()
         status = await get_pipeline_status(
@@ -152,7 +293,25 @@ async def cognify_status():
 
 @mcp.tool()
 async def codify_status():
-    """Get status of codify pipeline"""
+    """
+    Get the current status of the codify pipeline.
+
+    This function retrieves information about current and recently completed codify operations
+    in the codebase dataset. It provides details on progress, success/failure status, and statistics
+    about the processed code repositories.
+
+    Returns
+    -------
+    list
+        A list containing a single TextContent object with the status information as a string.
+        The status includes information about active and completed jobs for the cognify_code_pipeline.
+
+    Notes
+    -----
+    - The function retrieves pipeline status specifically for the "cognify_code_pipeline" on the "codebase" dataset
+    - Status information includes job progress, execution time, and completion status
+    - The status is returned in string format for easy reading
+    """
     with redirect_stdout(sys.stderr):
         user = await get_default_user()
         status = await get_pipeline_status(