refactor: Change input task names

2025-09-03 17:49:33 +02:00 · 2025-09-03 17:49:33 +02:00 · 0e3a10d925
commit 0e3a10d925
parent 90ef8c30d2
5 changed files with 51 additions and 148 deletions
--- a/cognee/api/v1/cognify/memify.py
+++ b/cognee/api/v1/cognify/memify.py
@ -1,5 +1,4 @@
 from typing import Union, Optional, List, Type, Any
 from dataclasses import field
 from uuid import UUID
 from cognee.shared.logging_utils import get_logger
@ -18,14 +17,17 @@ from cognee.modules.pipelines.layers.reset_dataset_pipeline_run_status import (
 )
 from cognee.modules.engine.operations.setup import setup
 from cognee.modules.pipelines.layers.pipeline_execution_mode import get_pipeline_executor
 from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks
 from cognee.tasks.codingagents.coding_rule_associations import (
    add_rule_associations,
 )
 logger = get_logger("memify")
 async def memify(
-    data_streaming_tasks: List[Task],
+    extraction_tasks: List[Task] = [Task(extract_subgraph_chunks)],
-    data_processing_tasks: List[Task] = [],
+    enrichment_tasks: List[Task] = [Task(add_rule_associations)],
    data_persistence_tasks: List[Task] = [],
    data: Optional[Any] = None,
    datasets: Union[str, list[str], list[UUID]] = None,
    user: User = None,
@ -66,9 +68,8 @@ async def memify(
            data = [memory_fragment]
    memify_tasks = [
-        *data_streaming_tasks,  # Unpack tasks provided to memify pipeline
+        *extraction_tasks,  # Unpack tasks provided to memify pipeline
-        *data_processing_tasks,
+        *enrichment_tasks,
        *data_persistence_tasks,
    ]
    await setup()
--- a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt
+++ b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt
@ -1,6 +0,0 @@
 You are an association agent tasked with suggesting structured developer rules from user-agent interactions stored in a Knowledge Graph.
 You will receive the actual user agent interaction as a set of relationships from a knowledge graph separated by \n---\n each represented as node1 -- relation -- node2 triplet, and the list of the already existing developer rules.
 Each rule represents a single best practice or guideline the agent should follow in the future.
 Suggest rules that are general and not specific to the knowledge graph relationships, strictly technical, add value and improve the future agent behavior.
 Do not suggest rules similar to the existing ones or rules that are not general and dont add value.
 It is acceptable to return an empty rule list.
--- a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt
+++ b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt
@ -1,6 +0,0 @@
 **Here is the User-agent interaction context provided with a set of relationships from a knowledge graph separated by \n---\n each represented as node1 -- relation -- node2 triplet:**
 `{{ chat }}`
 **Already existing rules:**
 `{{ rules }}`
--- a/examples/python/memify_coding_agent_example.py
+++ b/examples/python/memify_coding_agent_example.py
@ -7,8 +7,7 @@ from cognee.api.v1.visualize.visualize import visualize_graph
 from cognee.shared.logging_utils import setup_logging, ERROR
 from cognee.api.v1.cognify.memify import memify
 from cognee.modules.pipelines.tasks.task import Task
-from cognee.tasks.memify.extract_subgraph import extract_subgraph
+from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks
 from cognee.modules.graph.utils import resolve_edges_to_text
 from cognee.tasks.codingagents.coding_rule_associations import (
    add_rule_associations,
    get_existing_rules,
@ -26,54 +25,75 @@ async def main():
    await cognee.prune.prune_data()
    await cognee.prune.prune_system(metadata=True)
    print("Data reset complete.\n")
    print("Adding conversation about rules to cognee:\n")
-    # cognee knowledge graph will be created based on this text
+    coding_rules_chat_from_principal_engineer = """
-    text = """
+    We want code to be formatted by PEP8 standards.
    Natural language processing (NLP) is an interdisciplinary
    subfield of computer science and information retrieval.
    """
    coding_rules_text = """
    Code must be formatted by PEP8 standards.
    Typing and Docstrings must be added.
    Please also make sure to write NOTE: on all more complex code segments.
    If there is any duplicate code, try to handle it in one function to avoid code duplication.
    Susan should also always review new code changes before merging to main.
    New releases should not happen on Friday so we don't have to fix them during the weekend.
    """
    print(
        f"Coding rules conversation with principal engineer: {coding_rules_chat_from_principal_engineer}"
    )
    coding_rules_chat_from_manager = """
    Susan should always review new code changes before merging to main.
    New releases should not happen on Friday so we don't have to fix them during the weekend.
    """
    print(f"Coding rules conversation with manager: {coding_rules_chat_from_manager}")
    print("Adding text to cognee:")
    print(text.strip())
    # Add the text, and make it available for cognify
-    await cognee.add(text)
+    await cognee.add([coding_rules_chat_from_principal_engineer, coding_rules_chat_from_manager])
    await cognee.add(coding_rules_text, node_set=["coding_rules"])
    print("Text added successfully.\n")
    # Use LLMs and cognee to create knowledge graph
    await cognee.cognify()
    print("Cognify process complete.\n")
-    subgraph_extraction_tasks = [Task(extract_subgraph)]
+    # Visualize graph after cognification
    file_path = os.path.join(
        pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_only_cognify.html"
    )
    await visualize_graph(file_path)
    print(f"Open file to see graph visualization only after cognification: {file_path}")
-    rule_association_tasks = [
+    # After graph is created, create a second pipeline that will go through the graph and enchance it with specific
-        Task(resolve_edges_to_text, task_config={"batch_size": 10}),
+    # coding rule nodes
    # extract_subgraph_chunks is a function that returns all document chunks from specified subgraphs (if no subgraph is specifed the whole graph will be sent through memify)
    subgraph_extraction_tasks = [Task(extract_subgraph_chunks)]
    # add_rule_associations is a function that handles processing coding rules from chunks and keeps track of
    # existing rules so duplicate rules won't be created. As the result of this processing new Rule nodes will be created
    # in the graph that specify coding rules found in conversations.
    coding_rules_association_tasks = [
        Task(
            add_rule_associations,
            rules_nodeset_name="coding_agent_rules",
-            user_prompt_location="memify_coding_rule_association_agent_user.txt",
+            task_config={"batch_size": 1},
            system_prompt_location="memify_coding_rule_association_agent_system.txt",
        ),
    ]
    # Memify accepts these tasks and orchestrates forwarding of graph data through these tasks (if data is not specified).
    # If data is explicitely specified in the arguments this specified data will be forwarded through the tasks instead
    await memify(
-        data_streaming_tasks=subgraph_extraction_tasks,
+        extraction_tasks=subgraph_extraction_tasks,
-        data_processing_tasks=rule_association_tasks,
+        enrichment_tasks=coding_rules_association_tasks,
        node_name=["coding_rules"],
    )
    # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members)
    developer_rules = await get_existing_rules(rules_nodeset_name="coding_agent_rules")
    print(developer_rules)
    # Visualize new graph with added memify context
    file_path = os.path.join(
-        pathlib.Path(__file__).parent, ".artifacts", "graph_visualization.html"
+        pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_after_memify.html"
    )
    await visualize_graph(file_path)
    print(f"Open file to see graph visualization after memify enhancment: {file_path}")
 if __name__ == "__main__":
--- a/examples/python/memify_coding_agent_example_chunks.py
+++ b/examples/python/memify_coding_agent_example_chunks.py
@ -1,106 +0,0 @@
 import asyncio
 import pathlib
 import os
 import cognee
 from cognee.api.v1.visualize.visualize import visualize_graph
 from cognee.shared.logging_utils import setup_logging, ERROR
 from cognee.api.v1.cognify.memify import memify
 from cognee.modules.pipelines.tasks.task import Task
 from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks
 from cognee.tasks.codingagents.coding_rule_associations import (
    add_rule_associations,
    get_existing_rules,
 )
 # Prerequisites:
 # 1. Copy `.env.template` and rename it to `.env`.
 # 2. Add your OpenAI API key to the `.env` file in the `LLM_API_KEY` field:
 #    LLM_API_KEY = "your_key_here"
 async def main():
    # Create a clean slate for cognee -- reset data and system state
    print("Resetting cognee data...")
    await cognee.prune.prune_data()
    await cognee.prune.prune_system(metadata=True)
    print("Data reset complete.\n")
    print("Adding conversation about rules to cognee:\n")
    coding_rules_chat_from_principal_engineer = """
    We want code to be formatted by PEP8 standards.
    Typing and Docstrings must be added.
    Please also make sure to write NOTE: on all more complex code segments.
    If there is any duplicate code, try to handle it in one function to avoid code duplication.
    Susan should also always review new code changes before merging to main.
    New releases should not happen on Friday so we don't have to fix them during the weekend.
    """
    print(
        f"Coding rules conversation with principal engineer: {coding_rules_chat_from_principal_engineer}"
    )
    coding_rules_chat_from_manager = """
    Susan should always review new code changes before merging to main.
    New releases should not happen on Friday so we don't have to fix them during the weekend.
    """
    print(f"Coding rules conversation with manager: {coding_rules_chat_from_manager}")
    # Add the text, and make it available for cognify
    await cognee.add([coding_rules_chat_from_principal_engineer, coding_rules_chat_from_manager])
    print("Text added successfully.\n")
    # Use LLMs and cognee to create knowledge graph
    await cognee.cognify()
    print("Cognify process complete.\n")
    # Visualize graph after cognification
    file_path = os.path.join(
        pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_only_cognify.html"
    )
    await visualize_graph(file_path)
    print(f"Open file to see graph visualization only after cognification: {file_path}")
    # After graph is created, create a second pipeline that will go through the graph and enchance it with specific
    # coding rule nodes
    # extract_subgraph_chunks is a function that returns all document chunks from specified subgraphs (if no subgraph is specifed the whole graph will be sent through memify)
    subgraph_extraction_tasks = [Task(extract_subgraph_chunks)]
    # add_rule_associations is a function that handles processing coding rules from chunks and keeps track of
    # existing rules so duplicate rules won't be created. As the result of this processing new Rule nodes will be created
    # in the graph that specify coding rules found in conversations.
    coding_rules_association_tasks = [
        Task(
            add_rule_associations,
            rules_nodeset_name="coding_agent_rules",
            task_config={"batch_size": 1},
        ),
    ]
    # Memify accepts these tasks and orchestrates forwarding of graph data through these tasks (if data is not specified).
    # If data is explicitely specified in the arguments this specified data will be forwarded through the tasks instead
    await memify(
        data_streaming_tasks=subgraph_extraction_tasks,
        data_processing_tasks=coding_rules_association_tasks,
    )
    # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members)
    developer_rules = await get_existing_rules(rules_nodeset_name="coding_agent_rules")
    print(developer_rules)
    # Visualize new graph with added memify context
    file_path = os.path.join(
        pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_after_memify.html"
    )
    await visualize_graph(file_path)
    print(f"Open file to see graph visualization after memify enhancment: {file_path}")
 if __name__ == "__main__":
    logger = setup_logging(log_level=ERROR)
    loop = asyncio.new_event_loop()
    asyncio.set_event_loop(loop)
    try:
        loop.run_until_complete(main())
    finally:
        loop.run_until_complete(loop.shutdown_asyncgens())