From 72e5b2bec877c8c8d4775a1ff780673604c6ac92 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Mon, 1 Sep 2025 17:48:50 +0200 Subject: [PATCH 01/19] feat: Initial memify commit --- cognee/api/v1/cognify/memify.py | 71 +++++++++++++++++++++++++ cognee/tasks/memify/__init__.py | 1 + cognee/tasks/memify/extract_subgraph.py | 2 + 3 files changed, 74 insertions(+) create mode 100644 cognee/api/v1/cognify/memify.py create mode 100644 cognee/tasks/memify/__init__.py create mode 100644 cognee/tasks/memify/extract_subgraph.py diff --git a/cognee/api/v1/cognify/memify.py b/cognee/api/v1/cognify/memify.py new file mode 100644 index 000000000..65a622af7 --- /dev/null +++ b/cognee/api/v1/cognify/memify.py @@ -0,0 +1,71 @@ +from pydantic import BaseModel +from typing import Union, Optional, List, Type +from uuid import UUID + +from cognee.shared.logging_utils import get_logger +from cognee.shared.data_models import KnowledgeGraph +from cognee.infrastructure.llm import get_max_chunk_tokens + +from cognee.modules.engine.models.node_set import NodeSet +from cognee.modules.pipelines import run_pipeline +from cognee.modules.pipelines.tasks.task import Task +from cognee.modules.chunking.TextChunker import TextChunker +from cognee.modules.ontology.rdf_xml.OntologyResolver import OntologyResolver +from cognee.modules.users.models import User + +from cognee.tasks.memify import extract_subgraph +from cognee.modules.pipelines.layers.pipeline_execution_mode import get_pipeline_executor + +logger = get_logger("memify") + + +async def memify( + datasets: Union[str, list[str], list[UUID]] = None, + user: User = None, + tasks: List[Task] = None, + node_type: Optional[Type] = NodeSet, + node_name: Optional[List[str]] = None, + cypher_query: Optional[str] = None, + vector_db_config: dict = None, + graph_db_config: dict = None, + run_in_background: bool = False, +): + """ + Prerequisites: + - **LLM_API_KEY**: Must be configured (required for entity extraction and graph generation) + - **Data 
Added**: Must have data previously added via `cognee.add()` and `cognee.cognify()` + - **Vector Database**: Must be accessible for embeddings storage + - **Graph Database**: Must be accessible for relationship storage + + Args: + datasets: Dataset name(s) or dataset uuid to process. Processes all available data if None. + - Single dataset: "my_dataset" + - Multiple datasets: ["docs", "research", "reports"] + - None: Process all datasets for the user + user: User context for authentication and data access. Uses default if None. + vector_db_config: Custom vector database configuration for embeddings storage. + graph_db_config: Custom graph database configuration for relationship storage. + run_in_background: If True, starts processing asynchronously and returns immediately. + If False, waits for completion before returning. + Background mode recommended for large datasets (>100MB). + Use pipeline_run_id from return value to monitor progress. + """ + memify_tasks = [ + Task(extract_subgraph, cypher_query=cypher_query, node_type=node_type, node_name=node_name), + *tasks, # Unpack tasks provided to memify pipeline + ] + + # By calling get pipeline executor we get a function that will have the run_pipeline run in the background or a function that we will need to wait for + pipeline_executor_func = get_pipeline_executor(run_in_background=run_in_background) + + # Run the run_pipeline in the background or blocking based on executor + return await pipeline_executor_func( + pipeline=run_pipeline, + tasks=memify_tasks, + user=user, + datasets=datasets, + vector_db_config=vector_db_config, + graph_db_config=graph_db_config, + incremental_loading=False, + pipeline_name="memify_pipeline", + ) diff --git a/cognee/tasks/memify/__init__.py b/cognee/tasks/memify/__init__.py new file mode 100644 index 000000000..a95e88794 --- /dev/null +++ b/cognee/tasks/memify/__init__.py @@ -0,0 +1 @@ +from extract_subgraph import extract_subgraph diff --git a/cognee/tasks/memify/extract_subgraph.py 
b/cognee/tasks/memify/extract_subgraph.py new file mode 100644 index 000000000..1cf7ab951 --- /dev/null +++ b/cognee/tasks/memify/extract_subgraph.py @@ -0,0 +1,2 @@ +async def extract_subgraph(): + pass From 0bf8abcc6fb9491b03c27b7c6f3cea1753004a29 Mon Sep 17 00:00:00 2001 From: Hande <159312713+hande-k@users.noreply.github.com> Date: Tue, 2 Sep 2025 11:18:22 +0300 Subject: [PATCH 02/19] fix: add fix to low level example --- cognee/modules/data/methods/load_or_create_datasets.py | 2 +- examples/low_level/pipeline.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/cognee/modules/data/methods/load_or_create_datasets.py b/cognee/modules/data/methods/load_or_create_datasets.py index 1d6ef3efb..2c9a6497c 100644 --- a/cognee/modules/data/methods/load_or_create_datasets.py +++ b/cognee/modules/data/methods/load_or_create_datasets.py @@ -2,7 +2,7 @@ from typing import List, Union from uuid import UUID from cognee.modules.data.models import Dataset -from cognee.modules.data.methods import create_authorized_dataset +from cognee.modules.data.methods.create_authorized_dataset import create_authorized_dataset from cognee.modules.data.exceptions import DatasetNotFoundError diff --git a/examples/low_level/pipeline.py b/examples/low_level/pipeline.py index 804e42ff7..085d313a7 100644 --- a/examples/low_level/pipeline.py +++ b/examples/low_level/pipeline.py @@ -73,7 +73,7 @@ def ingest_files(data: List[Any]): new_company.departments.append(departments_data_points[department_name]) - return companies_data_points.values() + return list(companies_data_points.values()) async def main(): From 195e05a544ea5fe62cf92a767cd0ce0dc876fdd4 Mon Sep 17 00:00:00 2001 From: Hande <159312713+hande-k@users.noreply.github.com> Date: Tue, 2 Sep 2025 11:41:26 +0300 Subject: [PATCH 03/19] fix: add fix to starter-kit low level --- cognee-starter-kit/src/pipelines/low_level.py | 72 ++++++++++--------- 1 file changed, 40 insertions(+), 32 deletions(-) diff --git 
a/cognee-starter-kit/src/pipelines/low_level.py b/cognee-starter-kit/src/pipelines/low_level.py index 4c4c9d6da..8b4fccf33 100644 --- a/cognee-starter-kit/src/pipelines/low_level.py +++ b/cognee-starter-kit/src/pipelines/low_level.py @@ -1,14 +1,15 @@ import os -import uuid import json import asyncio import pathlib +from typing import List, Any from cognee import config, prune, search, SearchType, visualize_graph from cognee.low_level import setup, DataPoint from cognee.pipelines import run_tasks, Task from cognee.tasks.storage import add_data_points from cognee.tasks.storage.index_graph_edges import index_graph_edges from cognee.modules.users.methods import get_default_user +from cognee.modules.data.methods import load_or_create_datasets class Person(DataPoint): @@ -33,45 +34,51 @@ class Company(DataPoint): metadata: dict = {"index_fields": ["name"]} -def ingest_files(): - companies_file_path = os.path.join(os.path.dirname(__file__), "../data/companies.json") - companies = json.loads(open(companies_file_path, "r").read()) +def ingest_files(data: List[Any]): + if not data or data == [None]: + companies_file_path = os.path.join(os.path.dirname(__file__), "../data/companies.json") + companies = json.loads(open(companies_file_path, "r").read()) - people_file_path = os.path.join(os.path.dirname(__file__), "../data/people.json") - people = json.loads(open(people_file_path, "r").read()) + people_file_path = os.path.join(os.path.dirname(__file__), "../data/people.json") + people = json.loads(open(people_file_path, "r").read()) + + data = [{"companies": companies, "people": people}] people_data_points = {} departments_data_points = {} - - for person in people: - new_person = Person(name=person["name"]) - people_data_points[person["name"]] = new_person - - if person["department"] not in departments_data_points: - departments_data_points[person["department"]] = Department( - name=person["department"], employees=[new_person] - ) - else: - 
departments_data_points[person["department"]].employees.append(new_person) - companies_data_points = {} - # Create a single CompanyType node, so we connect all companies to it. - companyType = CompanyType() + for data_item in data: + people = data_item["people"] + companies = data_item["companies"] - for company in companies: - new_company = Company(name=company["name"], departments=[], is_type=companyType) - companies_data_points[company["name"]] = new_company + for person in people: + new_person = Person(name=person["name"]) + people_data_points[person["name"]] = new_person - for department_name in company["departments"]: - if department_name not in departments_data_points: - departments_data_points[department_name] = Department( - name=department_name, employees=[] + if person["department"] not in departments_data_points: + departments_data_points[person["department"]] = Department( + name=person["department"], employees=[new_person] ) + else: + departments_data_points[person["department"]].employees.append(new_person) - new_company.departments.append(departments_data_points[department_name]) + # Create a single CompanyType node, so we connect all companies to it. 
+ companyType = CompanyType() - return companies_data_points.values() + for company in companies: + new_company = Company(name=company["name"], departments=[], is_type=companyType) + companies_data_points[company["name"]] = new_company + + for department_name in company["departments"]: + if department_name not in departments_data_points: + departments_data_points[department_name] = Department( + name=department_name, employees=[] + ) + + new_company.departments.append(departments_data_points[department_name]) + + return list(companies_data_points.values()) async def main(): @@ -86,16 +93,17 @@ async def main(): await setup() - # Generate a random dataset_id - dataset_id = uuid.uuid4() + # Get default user user = await get_default_user() + datasets = await load_or_create_datasets(["demo_dataset"], [], user) + pipeline = run_tasks( [ Task(ingest_files), Task(add_data_points), ], - dataset_id, + datasets[0].id, None, user, "demo_pipeline", From af084af70fe8fc940aacea27f16cd400611932e0 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Tue, 2 Sep 2025 21:32:09 +0200 Subject: [PATCH 04/19] feat: Memify pipeline initial commit --- cognee/api/v1/add/add.py | 4 +- cognee/api/v1/cognify/memify.py | 48 +++++-- ...y_coding_rule_association_agent_system.txt | 6 + ...ify_coding_rule_association_agent_user.txt | 6 + .../modules/graph/cognee_graph/CogneeGraph.py | 69 ++++++++++ .../reset_dataset_pipeline_run_status.py | 22 +++- .../modules/pipelines/operations/pipeline.py | 1 + cognee/tasks/codingagents/__init__.py | 0 .../codingagents/coding_rule_associations.py | 124 ++++++++++++++++++ cognee/tasks/memify/__init__.py | 2 +- cognee/tasks/memify/extract_subgraph.py | 9 +- 11 files changed, 275 insertions(+), 16 deletions(-) create mode 100644 cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt create mode 100644 cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt create mode 100644 cognee/tasks/codingagents/__init__.py create 
mode 100644 cognee/tasks/codingagents/coding_rule_associations.py diff --git a/cognee/api/v1/add/add.py b/cognee/api/v1/add/add.py index 98771947c..eeb867984 100644 --- a/cognee/api/v1/add/add.py +++ b/cognee/api/v1/add/add.py @@ -150,7 +150,9 @@ async def add( user, authorized_dataset = await resolve_authorized_user_dataset(dataset_id, dataset_name, user) - await reset_dataset_pipeline_run_status(authorized_dataset.id, user) + await reset_dataset_pipeline_run_status( + authorized_dataset.id, user, pipeline_names=["add_pipeline", "cognify_pipeline"] + ) pipeline_run_info = None diff --git a/cognee/api/v1/cognify/memify.py b/cognee/api/v1/cognify/memify.py index 65a622af7..7e35ef5dc 100644 --- a/cognee/api/v1/cognify/memify.py +++ b/cognee/api/v1/cognify/memify.py @@ -1,28 +1,33 @@ -from pydantic import BaseModel from typing import Union, Optional, List, Type from uuid import UUID from cognee.shared.logging_utils import get_logger -from cognee.shared.data_models import KnowledgeGraph -from cognee.infrastructure.llm import get_max_chunk_tokens +from cognee.modules.retrieval.utils.brute_force_triplet_search import get_memory_fragment +from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph from cognee.modules.engine.models.node_set import NodeSet from cognee.modules.pipelines import run_pipeline from cognee.modules.pipelines.tasks.task import Task -from cognee.modules.chunking.TextChunker import TextChunker -from cognee.modules.ontology.rdf_xml.OntologyResolver import OntologyResolver from cognee.modules.users.models import User +from cognee.modules.pipelines.layers.resolve_authorized_user_datasets import ( + resolve_authorized_user_datasets, +) +from cognee.modules.pipelines.layers.reset_dataset_pipeline_run_status import ( + reset_dataset_pipeline_run_status, +) +from cognee.modules.engine.operations.setup import setup -from cognee.tasks.memify import extract_subgraph +from cognee.tasks.memify.extract_subgraph import extract_subgraph +from 
cognee.tasks.codingagents.coding_rule_associations import add_rule_associations from cognee.modules.pipelines.layers.pipeline_execution_mode import get_pipeline_executor logger = get_logger("memify") async def memify( + tasks: List[Task], datasets: Union[str, list[str], list[UUID]] = None, user: User = None, - tasks: List[Task] = None, node_type: Optional[Type] = NodeSet, node_name: Optional[List[str]] = None, cypher_query: Optional[str] = None, @@ -50,11 +55,35 @@ async def memify( Background mode recommended for large datasets (>100MB). Use pipeline_run_id from return value to monitor progress. """ + + if cypher_query: + pass + else: + memory_fragment = await get_memory_fragment(node_type=node_type, node_name=node_name) + # List of edges should be a single element in the list to represent one data item + data = [memory_fragment.edges] + memify_tasks = [ - Task(extract_subgraph, cypher_query=cypher_query, node_type=node_type, node_name=node_name), - *tasks, # Unpack tasks provided to memify pipeline + Task(extract_subgraph), + Task(CogneeGraph.resolve_edges_to_text, task_config={"batch_size": 10}), + Task( + add_rule_associations, + rules_nodeset_name="coding_agent_rules", + user_prompt_location="memify_coding_rule_association_agent_user.txt", + system_prompt_location="memify_coding_rule_association_agent_system.txt", + ), + # *tasks, # Unpack tasks provided to memify pipeline ] + await setup() + + user, authorized_datasets = await resolve_authorized_user_datasets(datasets, user) + + for dataset in authorized_datasets: + await reset_dataset_pipeline_run_status( + dataset.id, user, pipeline_names=["memify_pipeline"] + ) + # By calling get pipeline executor we get a function that will have the run_pipeline run in the background or a function that we will need to wait for pipeline_executor_func = get_pipeline_executor(run_in_background=run_in_background) @@ -63,6 +92,7 @@ async def memify( pipeline=run_pipeline, tasks=memify_tasks, user=user, + data=data, 
datasets=datasets, vector_db_config=vector_db_config, graph_db_config=graph_db_config, diff --git a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt new file mode 100644 index 000000000..31c9825bd --- /dev/null +++ b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt @@ -0,0 +1,6 @@ +You are an association agent tasked with suggesting structured developer rules from user-agent interactions stored in a Knowledge Graph. +You will receive the actual user agent interaction as a set of relationships from a knowledge graph separated by \n---\n each represented as node1 -- relation -- node2 triplet, and the list of the already existing developer rules. +Each rule represents a single best practice or guideline the agent should follow in the future. +Suggest rules that are general and not specific to the current text, strictly technical, add value and improve the future agent behavior. +Do not suggest rules similar to the existing ones or rules that are not general and dont add value. +It is acceptable to return an empty rule list. 
diff --git a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt new file mode 100644 index 000000000..9b525c625 --- /dev/null +++ b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt @@ -0,0 +1,6 @@ +**Here is the User-agent interaction context provided with a set of relationships from a knowledge graph separated by \n---\n each represented as node1 -- relation -- node2 triplet:** +`{{ chat }}` + + +**Already existing rules:** +`{{ rules }}` diff --git a/cognee/modules/graph/cognee_graph/CogneeGraph.py b/cognee/modules/graph/cognee_graph/CogneeGraph.py index 924532ce0..94a8e965e 100644 --- a/cognee/modules/graph/cognee_graph/CogneeGraph.py +++ b/cognee/modules/graph/cognee_graph/CogneeGraph.py @@ -188,3 +188,72 @@ class CogneeGraph(CogneeAbstractGraph): return n1 + n2 + e return heapq.nsmallest(k, self.edges, key=score) + + @staticmethod + async def resolve_edges_to_text(retrieved_edges: list) -> str: + """ + Converts retrieved graph edges into a human-readable string format. + + Parameters: + ----------- + + - retrieved_edges (list): A list of edges retrieved from the graph. + + Returns: + -------- + + - str: A formatted string representation of the nodes and their connections. 
+ """ + + def _get_nodes(retrieved_edges: list) -> dict: + def _get_title(text: str, first_n_words: int = 7, top_n_words: int = 3) -> str: + def _top_n_words(text, stop_words=None, top_n=3, separator=", "): + """Concatenates the top N frequent words in text.""" + if stop_words is None: + from cognee.modules.retrieval.utils.stop_words import DEFAULT_STOP_WORDS + + stop_words = DEFAULT_STOP_WORDS + + import string + + words = [word.lower().strip(string.punctuation) for word in text.split()] + + if stop_words: + words = [word for word in words if word and word not in stop_words] + + from collections import Counter + + top_words = [word for word, freq in Counter(words).most_common(top_n)] + + return separator.join(top_words) + + """Creates a title, by combining first words with most frequent words from the text.""" + first_n_words = text.split()[:first_n_words] + top_n_words = _top_n_words(text, top_n=top_n_words) + return f"{' '.join(first_n_words)}... [{top_n_words}]" + + """Creates a dictionary of nodes with their names and content.""" + nodes = {} + for edge in retrieved_edges: + for node in (edge.node1, edge.node2): + if node.id not in nodes: + text = node.attributes.get("text") + if text: + name = _get_title(text) + content = text + else: + name = node.attributes.get("name", "Unnamed Node") + content = node.attributes.get("description", name) + nodes[node.id] = {"node": node, "name": name, "content": content} + return nodes + + nodes = _get_nodes(retrieved_edges) + node_section = "\n".join( + f"Node: {info['name']}\n__node_content_start__\n{info['content']}\n__node_content_end__\n" + for info in nodes.values() + ) + connection_section = "\n".join( + f"{nodes[edge.node1.id]['name']} --[{edge.attributes['relationship_type']}]--> {nodes[edge.node2.id]['name']}" + for edge in retrieved_edges + ) + return f"Nodes:\n{node_section}\n\nConnections:\n{connection_section}" diff --git a/cognee/modules/pipelines/layers/reset_dataset_pipeline_run_status.py 
b/cognee/modules/pipelines/layers/reset_dataset_pipeline_run_status.py index cc72a6e51..bc59f9a6b 100644 --- a/cognee/modules/pipelines/layers/reset_dataset_pipeline_run_status.py +++ b/cognee/modules/pipelines/layers/reset_dataset_pipeline_run_status.py @@ -1,12 +1,28 @@ from uuid import UUID +from typing import Optional, List + from cognee.modules.pipelines.methods import get_pipeline_runs_by_dataset, reset_pipeline_run_status from cognee.modules.pipelines.models.PipelineRun import PipelineRunStatus from cognee.modules.users.models import User -async def reset_dataset_pipeline_run_status(dataset_id: UUID, user: User): +async def reset_dataset_pipeline_run_status( + dataset_id: UUID, user: User, pipeline_names: Optional[list[str]] = None +): + """Reset the status of all (or selected) pipeline runs for a dataset. + + If *pipeline_names* is given, only runs whose *pipeline_name* is in + that list are touched. + """ related_pipeline_runs = await get_pipeline_runs_by_dataset(dataset_id) for pipeline_run in related_pipeline_runs: - if pipeline_run.status is not PipelineRunStatus.DATASET_PROCESSING_INITIATED: - await reset_pipeline_run_status(user.id, dataset_id, pipeline_run.pipeline_name) + # Skip runs that are initiated + if pipeline_run.status is PipelineRunStatus.DATASET_PROCESSING_INITIATED: + continue + + # If a name filter is provided, skip non-matching runs + if pipeline_names is not None and pipeline_run.pipeline_name not in pipeline_names: + continue + + await reset_pipeline_run_status(user.id, dataset_id, pipeline_run.pipeline_name) diff --git a/cognee/modules/pipelines/operations/pipeline.py b/cognee/modules/pipelines/operations/pipeline.py index cbe6dee5c..b59a171f7 100644 --- a/cognee/modules/pipelines/operations/pipeline.py +++ b/cognee/modules/pipelines/operations/pipeline.py @@ -5,6 +5,7 @@ from typing import Union from cognee.modules.pipelines.layers.setup_and_check_environment import ( setup_and_check_environment, ) + from cognee.shared.logging_utils 
import get_logger from cognee.modules.data.methods.get_dataset_data import get_dataset_data from cognee.modules.data.models import Data, Dataset diff --git a/cognee/tasks/codingagents/__init__.py b/cognee/tasks/codingagents/__init__.py new file mode 100644 index 000000000..e69de29bb diff --git a/cognee/tasks/codingagents/coding_rule_associations.py b/cognee/tasks/codingagents/coding_rule_associations.py new file mode 100644 index 000000000..6971ecc83 --- /dev/null +++ b/cognee/tasks/codingagents/coding_rule_associations.py @@ -0,0 +1,124 @@ +from uuid import NAMESPACE_OID, uuid5 + +from cognee.infrastructure.databases.graph import get_graph_engine +from cognee.infrastructure.databases.vector import get_vector_engine + +from cognee.low_level import DataPoint +from cognee.infrastructure.llm import LLMGateway +from cognee.shared.logging_utils import get_logger +from cognee.modules.engine.models import NodeSet +from cognee.tasks.storage import add_data_points, index_graph_edges +from typing import Optional, List, Any +from pydantic import Field + +logger = get_logger("coding_rule_association") + + +class Rule(DataPoint): + """A single developer rule extracted from text.""" + + text: str = Field(..., description="The coding rule associated with the conversation") + belongs_to_set: Optional[NodeSet] = None + metadata: dict = {"index_fields": ["rule"]} + + +class RuleSet(DataPoint): + """Collection of parsed rules.""" + + rules: List[Rule] = Field( + ..., + description="List of developer rules extracted from the input text. 
Each rule represents a coding best practice or guideline.", + ) + + +async def get_existing_rules(rules_nodeset_name: str) -> str: + graph_engine = await get_graph_engine() + nodes_data, _ = await graph_engine.get_nodeset_subgraph( + node_type=NodeSet, node_name=[rules_nodeset_name] + ) + + existing_rules = [ + item[1]["text"] + for item in nodes_data + if isinstance(item, tuple) + and len(item) == 2 + and isinstance(item[1], dict) + and "text" in item[1] + ] + + existing_rules = "\n".join(f"- {rule}" for rule in existing_rules) + + return existing_rules + + +async def get_origin_edges(data: str, rules: List[Rule]) -> list[Any]: + vector_engine = get_vector_engine() + + origin_chunk = await vector_engine.search("DocumentChunk_text", data, limit=1) + + try: + origin_id = origin_chunk[0].id + except (AttributeError, KeyError, TypeError, IndexError): + origin_id = None + + relationships = [] + + if origin_id and isinstance(rules, (list, tuple)) and len(rules) > 0: + for rule in rules: + try: + rule_id = getattr(rule, "id", None) + if rule_id is not None: + rel_name = "rule_associated_from" + relationships.append( + ( + rule_id, + origin_id, + rel_name, + { + "relationship_name": rel_name, + "source_node_id": rule_id, + "target_node_id": origin_id, + "ontology_valid": False, + }, + ) + ) + except Exception as e: + logger.info(f"Warning: Skipping invalid rule due to error: {e}") + else: + logger.info("No valid origin_id or rules provided.") + + return relationships + + +async def add_rule_associations( + data: str, + rules_nodeset_name: str, + user_prompt_location: str = "coding_rule_association_agent_user.txt", + system_prompt_location: str = "coding_rule_association_agent_system.txt", +): + graph_engine = await get_graph_engine() + existing_rules = await get_existing_rules(rules_nodeset_name=rules_nodeset_name) + + user_context = {"user data": data, "rules": existing_rules} + + user_prompt = LLMGateway.render_prompt(user_prompt_location, context=user_context) + 
system_prompt = LLMGateway.render_prompt(system_prompt_location, context={}) + + rule_list = await LLMGateway.acreate_structured_output( + text_input=user_prompt, system_prompt=system_prompt, response_model=RuleSet + ) + + rules_nodeset = NodeSet( + id=uuid5(NAMESPACE_OID, name=rules_nodeset_name), name=rules_nodeset_name + ) + for rule in rule_list.rules: + rule.belongs_to_set = rules_nodeset + + edges_to_save = await get_origin_edges(data=data, rules=rule_list.rules) + + await add_data_points(data_points=rule_list.rules) + + if len(edges_to_save) > 0: + await graph_engine.add_edges(edges_to_save) + + await index_graph_edges() diff --git a/cognee/tasks/memify/__init__.py b/cognee/tasks/memify/__init__.py index a95e88794..d2e0172f6 100644 --- a/cognee/tasks/memify/__init__.py +++ b/cognee/tasks/memify/__init__.py @@ -1 +1 @@ -from extract_subgraph import extract_subgraph +from .extract_subgraph import extract_subgraph diff --git a/cognee/tasks/memify/extract_subgraph.py b/cognee/tasks/memify/extract_subgraph.py index 1cf7ab951..198a5b367 100644 --- a/cognee/tasks/memify/extract_subgraph.py +++ b/cognee/tasks/memify/extract_subgraph.py @@ -1,2 +1,7 @@ -async def extract_subgraph(): - pass +from cognee.modules.retrieval.utils.brute_force_triplet_search import get_memory_fragment + + +async def extract_subgraph(subgraphs): + for subgraph in subgraphs: + for edge in subgraph: + yield edge From 1a2977779f49001c5696330b005a3c90d75f6b7f Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Wed, 3 Sep 2025 12:03:17 +0200 Subject: [PATCH 05/19] feat: Add memify coding agent example --- cognee/api/v1/cognify/memify.py | 12 +-- .../python/memify_coding_agent_example.py | 76 +++++++++++++++++++ 2 files changed, 78 insertions(+), 10 deletions(-) create mode 100644 examples/python/memify_coding_agent_example.py diff --git a/cognee/api/v1/cognify/memify.py b/cognee/api/v1/cognify/memify.py index 7e35ef5dc..df45bac76 100644 --- a/cognee/api/v1/cognify/memify.py +++ 
b/cognee/api/v1/cognify/memify.py @@ -4,7 +4,7 @@ from uuid import UUID from cognee.shared.logging_utils import get_logger from cognee.modules.retrieval.utils.brute_force_triplet_search import get_memory_fragment -from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph + from cognee.modules.engine.models.node_set import NodeSet from cognee.modules.pipelines import run_pipeline from cognee.modules.pipelines.tasks.task import Task @@ -18,7 +18,6 @@ from cognee.modules.pipelines.layers.reset_dataset_pipeline_run_status import ( from cognee.modules.engine.operations.setup import setup from cognee.tasks.memify.extract_subgraph import extract_subgraph -from cognee.tasks.codingagents.coding_rule_associations import add_rule_associations from cognee.modules.pipelines.layers.pipeline_execution_mode import get_pipeline_executor logger = get_logger("memify") @@ -65,14 +64,7 @@ async def memify( memify_tasks = [ Task(extract_subgraph), - Task(CogneeGraph.resolve_edges_to_text, task_config={"batch_size": 10}), - Task( - add_rule_associations, - rules_nodeset_name="coding_agent_rules", - user_prompt_location="memify_coding_rule_association_agent_user.txt", - system_prompt_location="memify_coding_rule_association_agent_system.txt", - ), - # *tasks, # Unpack tasks provided to memify pipeline + *tasks, # Unpack tasks provided to memify pipeline ] await setup() diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py new file mode 100644 index 000000000..70064c346 --- /dev/null +++ b/examples/python/memify_coding_agent_example.py @@ -0,0 +1,76 @@ +import asyncio +import cognee +from cognee.shared.logging_utils import setup_logging, ERROR +from cognee.api.v1.search import SearchType + +# Prerequisites: +# 1. Copy `.env.template` and rename it to `.env`. +# 2. 
Add your OpenAI API key to the `.env` file in the `LLM_API_KEY` field: +# LLM_API_KEY = "your_key_here" + + +async def main(): + # Create a clean slate for cognee -- reset data and system state + print("Resetting cognee data...") + await cognee.prune.prune_data() + await cognee.prune.prune_system(metadata=True) + print("Data reset complete.\n") + + # cognee knowledge graph will be created based on this text + text = """ + Natural language processing (NLP) is an interdisciplinary + subfield of computer science and information retrieval. + """ + + coding_rules_text = """ + Code must be formatted by PEP8 standards. + Typing and Docstrings must be added. + """ + + print("Adding text to cognee:") + print(text.strip()) + # Add the text, and make it available for cognify + await cognee.add(text) + await cognee.add(coding_rules_text, node_set=["coding_rules"]) + print("Text added successfully.\n") + + # Use LLMs and cognee to create knowledge graph + await cognee.cognify() + print("Cognify process complete.\n") + + from cognee.api.v1.cognify.memify import memify + + from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph + from cognee.tasks.codingagents.coding_rule_associations import add_rule_associations + from cognee.modules.pipelines.tasks.task import Task + + memify_tasks = [ + Task(CogneeGraph.resolve_edges_to_text, task_config={"batch_size": 10}), + Task( + add_rule_associations, + rules_nodeset_name="coding_agent_rules", + user_prompt_location="memify_coding_rule_association_agent_user.txt", + system_prompt_location="memify_coding_rule_association_agent_system.txt", + ), + ] + + await memify(tasks=memify_tasks, node_name=["coding_rules"]) + + import os + import pathlib + from cognee.api.v1.visualize.visualize import visualize_graph + + file_path = os.path.join( + pathlib.Path(__file__).parent, ".artifacts", "graph_visualization.html" + ) + await visualize_graph(file_path) + + +if __name__ == "__main__": + logger = setup_logging(log_level=ERROR) + loop 
= asyncio.new_event_loop() + asyncio.set_event_loop(loop) + try: + loop.run_until_complete(main()) + finally: + loop.run_until_complete(loop.shutdown_asyncgens()) From 2847569616cb47fa6f76c511d2d654a399dc24f1 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Wed, 3 Sep 2025 16:08:32 +0200 Subject: [PATCH 06/19] feat: memify next iteration --- cognee/api/v1/cognify/memify.py | 28 +++-- ...y_coding_rule_association_agent_system.txt | 2 +- .../modules/graph/cognee_graph/CogneeGraph.py | 69 ------------ cognee/modules/graph/utils/__init__.py | 1 + .../graph/utils/resolve_edges_to_text.py | 67 +++++++++++ .../retrieval/graph_completion_retriever.py | 48 +------- .../codingagents/coding_rule_associations.py | 6 +- cognee/tasks/memify/__init__.py | 1 + cognee/tasks/memify/extract_subgraph.py | 6 +- .../tasks/memify/extract_subgraph_chunks.py | 11 ++ .../python/memify_coding_agent_example.py | 34 ++++-- .../memify_coding_agent_example_chunks.py | 106 ++++++++++++++++++ 12 files changed, 235 insertions(+), 144 deletions(-) create mode 100644 cognee/modules/graph/utils/resolve_edges_to_text.py create mode 100644 cognee/tasks/memify/extract_subgraph_chunks.py create mode 100644 examples/python/memify_coding_agent_example_chunks.py diff --git a/cognee/api/v1/cognify/memify.py b/cognee/api/v1/cognify/memify.py index df45bac76..8237059ec 100644 --- a/cognee/api/v1/cognify/memify.py +++ b/cognee/api/v1/cognify/memify.py @@ -1,4 +1,5 @@ -from typing import Union, Optional, List, Type +from typing import Union, Optional, List, Type, Any +from dataclasses import field from uuid import UUID from cognee.shared.logging_utils import get_logger @@ -16,15 +17,16 @@ from cognee.modules.pipelines.layers.reset_dataset_pipeline_run_status import ( reset_dataset_pipeline_run_status, ) from cognee.modules.engine.operations.setup import setup - -from cognee.tasks.memify.extract_subgraph import extract_subgraph from cognee.modules.pipelines.layers.pipeline_execution_mode import get_pipeline_executor 
logger = get_logger("memify") async def memify( - tasks: List[Task], + preprocessing_tasks: List[Task], + processing_tasks: List[Task] = [], + postprocessing_tasks: List[Task] = [], + data: Optional[Any] = None, datasets: Union[str, list[str], list[UUID]] = None, user: User = None, node_type: Optional[Type] = NodeSet, @@ -55,16 +57,18 @@ async def memify( Use pipeline_run_id from return value to monitor progress. """ - if cypher_query: - pass - else: - memory_fragment = await get_memory_fragment(node_type=node_type, node_name=node_name) - # List of edges should be a single element in the list to represent one data item - data = [memory_fragment.edges] + if not data: + if cypher_query: + pass + else: + memory_fragment = await get_memory_fragment(node_type=node_type, node_name=node_name) + # Subgraphs should be a single element in the list to represent one data item + data = [memory_fragment] memify_tasks = [ - Task(extract_subgraph), - *tasks, # Unpack tasks provided to memify pipeline + *preprocessing_tasks, # Unpack tasks provided to memify pipeline + *processing_tasks, + *postprocessing_tasks, ] await setup() diff --git a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt index 31c9825bd..d9adf45f7 100644 --- a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt +++ b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt @@ -1,6 +1,6 @@ You are an association agent tasked with suggesting structured developer rules from user-agent interactions stored in a Knowledge Graph. You will receive the actual user agent interaction as a set of relationships from a knowledge graph separated by \n---\n each represented as node1 -- relation -- node2 triplet, and the list of the already existing developer rules. Each rule represents a single best practice or guideline the agent should follow in the future. 
-Suggest rules that are general and not specific to the current text, strictly technical, add value and improve the future agent behavior. +Suggest rules that are general and not specific to the knowledge graph relationships, strictly technical, add value and improve the future agent behavior. Do not suggest rules similar to the existing ones or rules that are not general and dont add value. It is acceptable to return an empty rule list. diff --git a/cognee/modules/graph/cognee_graph/CogneeGraph.py b/cognee/modules/graph/cognee_graph/CogneeGraph.py index 94a8e965e..924532ce0 100644 --- a/cognee/modules/graph/cognee_graph/CogneeGraph.py +++ b/cognee/modules/graph/cognee_graph/CogneeGraph.py @@ -188,72 +188,3 @@ class CogneeGraph(CogneeAbstractGraph): return n1 + n2 + e return heapq.nsmallest(k, self.edges, key=score) - - @staticmethod - async def resolve_edges_to_text(retrieved_edges: list) -> str: - """ - Converts retrieved graph edges into a human-readable string format. - - Parameters: - ----------- - - - retrieved_edges (list): A list of edges retrieved from the graph. - - Returns: - -------- - - - str: A formatted string representation of the nodes and their connections. 
- """ - - def _get_nodes(retrieved_edges: list) -> dict: - def _get_title(text: str, first_n_words: int = 7, top_n_words: int = 3) -> str: - def _top_n_words(text, stop_words=None, top_n=3, separator=", "): - """Concatenates the top N frequent words in text.""" - if stop_words is None: - from cognee.modules.retrieval.utils.stop_words import DEFAULT_STOP_WORDS - - stop_words = DEFAULT_STOP_WORDS - - import string - - words = [word.lower().strip(string.punctuation) for word in text.split()] - - if stop_words: - words = [word for word in words if word and word not in stop_words] - - from collections import Counter - - top_words = [word for word, freq in Counter(words).most_common(top_n)] - - return separator.join(top_words) - - """Creates a title, by combining first words with most frequent words from the text.""" - first_n_words = text.split()[:first_n_words] - top_n_words = _top_n_words(text, top_n=top_n_words) - return f"{' '.join(first_n_words)}... [{top_n_words}]" - - """Creates a dictionary of nodes with their names and content.""" - nodes = {} - for edge in retrieved_edges: - for node in (edge.node1, edge.node2): - if node.id not in nodes: - text = node.attributes.get("text") - if text: - name = _get_title(text) - content = text - else: - name = node.attributes.get("name", "Unnamed Node") - content = node.attributes.get("description", name) - nodes[node.id] = {"node": node, "name": name, "content": content} - return nodes - - nodes = _get_nodes(retrieved_edges) - node_section = "\n".join( - f"Node: {info['name']}\n__node_content_start__\n{info['content']}\n__node_content_end__\n" - for info in nodes.values() - ) - connection_section = "\n".join( - f"{nodes[edge.node1.id]['name']} --[{edge.attributes['relationship_type']}]--> {nodes[edge.node2.id]['name']}" - for edge in retrieved_edges - ) - return f"Nodes:\n{node_section}\n\nConnections:\n{connection_section}" diff --git a/cognee/modules/graph/utils/__init__.py b/cognee/modules/graph/utils/__init__.py index 
d1cda2d83..ebc648495 100644 --- a/cognee/modules/graph/utils/__init__.py +++ b/cognee/modules/graph/utils/__init__.py @@ -4,3 +4,4 @@ from .get_model_instance_from_graph import get_model_instance_from_graph from .retrieve_existing_edges import retrieve_existing_edges from .convert_node_to_data_point import convert_node_to_data_point from .deduplicate_nodes_and_edges import deduplicate_nodes_and_edges +from .resolve_edges_to_text import resolve_edges_to_text diff --git a/cognee/modules/graph/utils/resolve_edges_to_text.py b/cognee/modules/graph/utils/resolve_edges_to_text.py new file mode 100644 index 000000000..56c303abc --- /dev/null +++ b/cognee/modules/graph/utils/resolve_edges_to_text.py @@ -0,0 +1,67 @@ +async def resolve_edges_to_text(retrieved_edges: list) -> str: + """ + Converts retrieved graph edges into a human-readable string format. + + Parameters: + ----------- + + - retrieved_edges (list): A list of edges retrieved from the graph. + + Returns: + -------- + + - str: A formatted string representation of the nodes and their connections. 
+ """ + + def _get_nodes(retrieved_edges: list) -> dict: + def _get_title(text: str, first_n_words: int = 7, top_n_words: int = 3) -> str: + def _top_n_words(text, stop_words=None, top_n=3, separator=", "): + """Concatenates the top N frequent words in text.""" + if stop_words is None: + from cognee.modules.retrieval.utils.stop_words import DEFAULT_STOP_WORDS + + stop_words = DEFAULT_STOP_WORDS + + import string + + words = [word.lower().strip(string.punctuation) for word in text.split()] + + if stop_words: + words = [word for word in words if word and word not in stop_words] + + from collections import Counter + + top_words = [word for word, freq in Counter(words).most_common(top_n)] + + return separator.join(top_words) + + """Creates a title, by combining first words with most frequent words from the text.""" + first_n_words = text.split()[:first_n_words] + top_n_words = _top_n_words(text, top_n=top_n_words) + return f"{' '.join(first_n_words)}... [{top_n_words}]" + + """Creates a dictionary of nodes with their names and content.""" + nodes = {} + for edge in retrieved_edges: + for node in (edge.node1, edge.node2): + if node.id not in nodes: + text = node.attributes.get("text") + if text: + name = _get_title(text) + content = text + else: + name = node.attributes.get("name", "Unnamed Node") + content = node.attributes.get("description", name) + nodes[node.id] = {"node": node, "name": name, "content": content} + return nodes + + nodes = _get_nodes(retrieved_edges) + node_section = "\n".join( + f"Node: {info['name']}\n__node_content_start__\n{info['content']}\n__node_content_end__\n" + for info in nodes.values() + ) + connection_section = "\n".join( + f"{nodes[edge.node1.id]['name']} --[{edge.attributes['relationship_type']}]--> {nodes[edge.node2.id]['name']}" + for edge in retrieved_edges + ) + return f"Nodes:\n{node_section}\n\nConnections:\n{connection_section}" diff --git a/cognee/modules/retrieval/graph_completion_retriever.py 
b/cognee/modules/retrieval/graph_completion_retriever.py index 6a5193c56..bc4fa27b3 100644 --- a/cognee/modules/retrieval/graph_completion_retriever.py +++ b/cognee/modules/retrieval/graph_completion_retriever.py @@ -5,6 +5,7 @@ import string from cognee.infrastructure.engine import DataPoint from cognee.tasks.storage import add_data_points +from cognee.modules.graph.utils import resolve_edges_to_text from cognee.modules.graph.utils.convert_node_to_data_point import get_all_subclasses from cognee.modules.retrieval.base_retriever import BaseRetriever from cognee.modules.retrieval.utils.brute_force_triplet_search import brute_force_triplet_search @@ -53,22 +54,6 @@ class GraphCompletionRetriever(BaseRetriever): self.node_type = node_type self.node_name = node_name - def _get_nodes(self, retrieved_edges: list) -> dict: - """Creates a dictionary of nodes with their names and content.""" - nodes = {} - for edge in retrieved_edges: - for node in (edge.node1, edge.node2): - if node.id not in nodes: - text = node.attributes.get("text") - if text: - name = self._get_title(text) - content = text - else: - name = node.attributes.get("name", "Unnamed Node") - content = node.attributes.get("description", name) - nodes[node.id] = {"node": node, "name": name, "content": content} - return nodes - async def resolve_edges_to_text(self, retrieved_edges: list) -> str: """ Converts retrieved graph edges into a human-readable string format. @@ -83,16 +68,7 @@ class GraphCompletionRetriever(BaseRetriever): - str: A formatted string representation of the nodes and their connections. 
""" - nodes = self._get_nodes(retrieved_edges) - node_section = "\n".join( - f"Node: {info['name']}\n__node_content_start__\n{info['content']}\n__node_content_end__\n" - for info in nodes.values() - ) - connection_section = "\n".join( - f"{nodes[edge.node1.id]['name']} --[{edge.attributes['relationship_type']}]--> {nodes[edge.node2.id]['name']}" - for edge in retrieved_edges - ) - return f"Nodes:\n{node_section}\n\nConnections:\n{connection_section}" + return await resolve_edges_to_text(retrieved_edges) async def get_triplets(self, query: str) -> list: """ @@ -196,26 +172,6 @@ class GraphCompletionRetriever(BaseRetriever): return [completion] - def _top_n_words(self, text, stop_words=None, top_n=3, separator=", "): - """Concatenates the top N frequent words in text.""" - if stop_words is None: - stop_words = DEFAULT_STOP_WORDS - - words = [word.lower().strip(string.punctuation) for word in text.split()] - - if stop_words: - words = [word for word in words if word and word not in stop_words] - - top_words = [word for word, freq in Counter(words).most_common(top_n)] - - return separator.join(top_words) - - def _get_title(self, text: str, first_n_words: int = 7, top_n_words: int = 3) -> str: - """Creates a title, by combining first words with most frequent words from the text.""" - first_n_words = text.split()[:first_n_words] - top_n_words = self._top_n_words(text, top_n=top_n_words) - return f"{' '.join(first_n_words)}... [{top_n_words}]" - async def save_qa(self, question: str, answer: str, context: str, triplets: List) -> None: """ Saves a question and answer pair for later analysis or storage. 
diff --git a/cognee/tasks/codingagents/coding_rule_associations.py b/cognee/tasks/codingagents/coding_rule_associations.py index 6971ecc83..e722e7728 100644 --- a/cognee/tasks/codingagents/coding_rule_associations.py +++ b/cognee/tasks/codingagents/coding_rule_associations.py @@ -96,10 +96,14 @@ async def add_rule_associations( user_prompt_location: str = "coding_rule_association_agent_user.txt", system_prompt_location: str = "coding_rule_association_agent_system.txt", ): + if isinstance(data, list): + # If data is a list of strings join all strings in list + data = " ".join(data) + graph_engine = await get_graph_engine() existing_rules = await get_existing_rules(rules_nodeset_name=rules_nodeset_name) - user_context = {"user data": data, "rules": existing_rules} + user_context = {"chat": data, "rules": existing_rules} user_prompt = LLMGateway.render_prompt(user_prompt_location, context=user_context) system_prompt = LLMGateway.render_prompt(system_prompt_location, context={}) diff --git a/cognee/tasks/memify/__init__.py b/cognee/tasks/memify/__init__.py index d2e0172f6..692bac443 100644 --- a/cognee/tasks/memify/__init__.py +++ b/cognee/tasks/memify/__init__.py @@ -1 +1,2 @@ from .extract_subgraph import extract_subgraph +from .extract_subgraph_chunks import extract_subgraph_chunks diff --git a/cognee/tasks/memify/extract_subgraph.py b/cognee/tasks/memify/extract_subgraph.py index 198a5b367..d6ca3773f 100644 --- a/cognee/tasks/memify/extract_subgraph.py +++ b/cognee/tasks/memify/extract_subgraph.py @@ -1,7 +1,7 @@ -from cognee.modules.retrieval.utils.brute_force_triplet_search import get_memory_fragment +from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph -async def extract_subgraph(subgraphs): +async def extract_subgraph(subgraphs: list[CogneeGraph]): for subgraph in subgraphs: - for edge in subgraph: + for edge in subgraph.edges: yield edge diff --git a/cognee/tasks/memify/extract_subgraph_chunks.py 
b/cognee/tasks/memify/extract_subgraph_chunks.py new file mode 100644 index 000000000..9aab498d7 --- /dev/null +++ b/cognee/tasks/memify/extract_subgraph_chunks.py @@ -0,0 +1,11 @@ +from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph + + +async def extract_subgraph_chunks(subgraphs: list[CogneeGraph]): + """ + Get all Document Chunks from subgraphs and forward to next task in pipeline + """ + for subgraph in subgraphs: + for node in subgraph.nodes.values(): + if node.attributes["type"] == "DocumentChunk": + yield node.attributes["text"] diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py index 70064c346..004a840f8 100644 --- a/examples/python/memify_coding_agent_example.py +++ b/examples/python/memify_coding_agent_example.py @@ -1,7 +1,18 @@ import asyncio +import pathlib +import os + import cognee +from cognee.api.v1.visualize.visualize import visualize_graph from cognee.shared.logging_utils import setup_logging, ERROR -from cognee.api.v1.search import SearchType +from cognee.api.v1.cognify.memify import memify +from cognee.modules.pipelines.tasks.task import Task +from cognee.tasks.memify.extract_subgraph import extract_subgraph +from cognee.modules.graph.utils import resolve_edges_to_text +from cognee.tasks.codingagents.coding_rule_associations import ( + add_rule_associations, + get_existing_rules, +) # Prerequisites: # 1. Copy `.env.template` and rename it to `.env`. 
@@ -38,14 +49,10 @@ async def main(): await cognee.cognify() print("Cognify process complete.\n") - from cognee.api.v1.cognify.memify import memify + subgraph_extraction_tasks = [Task(extract_subgraph)] - from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph - from cognee.tasks.codingagents.coding_rule_associations import add_rule_associations - from cognee.modules.pipelines.tasks.task import Task - - memify_tasks = [ - Task(CogneeGraph.resolve_edges_to_text, task_config={"batch_size": 10}), + rule_association_tasks = [ + Task(resolve_edges_to_text, task_config={"batch_size": 10}), Task( add_rule_associations, rules_nodeset_name="coding_agent_rules", @@ -54,11 +61,14 @@ async def main(): ), ] - await memify(tasks=memify_tasks, node_name=["coding_rules"]) + await memify( + preprocessing_tasks=subgraph_extraction_tasks, + processing_tasks=rule_association_tasks, + node_name=["coding_rules"], + ) - import os - import pathlib - from cognee.api.v1.visualize.visualize import visualize_graph + developer_rules = await get_existing_rules(rules_nodeset_name="coding_agent_rules") + print(developer_rules) file_path = os.path.join( pathlib.Path(__file__).parent, ".artifacts", "graph_visualization.html" diff --git a/examples/python/memify_coding_agent_example_chunks.py b/examples/python/memify_coding_agent_example_chunks.py new file mode 100644 index 000000000..b07bcb815 --- /dev/null +++ b/examples/python/memify_coding_agent_example_chunks.py @@ -0,0 +1,106 @@ +import asyncio +import pathlib +import os + +import cognee +from cognee.api.v1.visualize.visualize import visualize_graph +from cognee.shared.logging_utils import setup_logging, ERROR +from cognee.api.v1.cognify.memify import memify +from cognee.modules.pipelines.tasks.task import Task +from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks +from cognee.tasks.codingagents.coding_rule_associations import ( + add_rule_associations, + get_existing_rules, +) + +# Prerequisites: +# 1. 
Copy `.env.template` and rename it to `.env`. +# 2. Add your OpenAI API key to the `.env` file in the `LLM_API_KEY` field: +# LLM_API_KEY = "your_key_here" + + +async def main(): + # Create a clean slate for cognee -- reset data and system state + print("Resetting cognee data...") + await cognee.prune.prune_data() + await cognee.prune.prune_system(metadata=True) + print("Data reset complete.\n") + print("Adding conversation about rules to cognee:\n") + + coding_rules_chat_from_principal_engineer = """ + We want code to be formatted by PEP8 standards. + Typing and Docstrings must be added. + Please also make sure to write NOTE: on all more complex code segments. + If there is any duplicate code, try to handle it in one function to avoid code duplication. + Susan should also always review new code changes before merging to main. + New releases should not happen on Friday so we don't have to fix them during the weekend. + """ + print( + f"Coding rules conversation with principal engineer: {coding_rules_chat_from_principal_engineer}" + ) + + coding_rules_chat_from_manager = """ + Susan should always review new code changes before merging to main. + New releases should not happen on Friday so we don't have to fix them during the weekend. 
+ """ + print(f"Coding rules conversation with manager: {coding_rules_chat_from_manager}") + + # Add the text, and make it available for cognify + await cognee.add([coding_rules_chat_from_principal_engineer, coding_rules_chat_from_manager]) + print("Text added successfully.\n") + + # Use LLMs and cognee to create knowledge graph + await cognee.cognify() + print("Cognify process complete.\n") + + # Visualize graph after cognification + file_path = os.path.join( + pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_only_cognify.html" + ) + await visualize_graph(file_path) + print(f"Open file to see graph visualization only after cognification: {file_path}") + + # After graph is created, create a second pipeline that will go through the graph and enchance it with specific + # coding rule nodes + + # extract_subgraph_chunks is a function that returns all document chunks from specified subgraphs (if no subgraph is specifed the whole graph will be sent through memify) + subgraph_extraction_tasks = [Task(extract_subgraph_chunks)] + + # add_rule_associations is a function that handles processing coding rules from chunks and keeps track of + # existing rules so duplicate rules won't be created. As the result of this processing new Rule nodes will be created + # in the graph that specify coding rules found in conversations. + coding_rules_association_tasks = [ + Task( + add_rule_associations, + rules_nodeset_name="coding_agent_rules", + task_config={"batch_size": 1}, + ), + ] + + # Memify accepts these tasks and orchestrates forwarding of graph data through these tasks (if data is not specified). 
+ # If data is explicitely specified in the arguments this specified data will be forwarded through the tasks instead + await memify( + preprocessing_tasks=subgraph_extraction_tasks, + processing_tasks=coding_rules_association_tasks, + ) + + # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members) + developer_rules = await get_existing_rules(rules_nodeset_name="coding_agent_rules") + print(developer_rules) + + # Visualize new graph with added memify context + file_path = os.path.join( + pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_after_memify.html" + ) + await visualize_graph(file_path) + print(f"Open file to see graph visualization after memify enhancment: {file_path}") + + +if __name__ == "__main__": + logger = setup_logging(log_level=ERROR) + loop = asyncio.new_event_loop() + asyncio.set_event_loop(loop) + try: + loop.run_until_complete(main()) + finally: + loop.run_until_complete(loop.shutdown_asyncgens()) From 90ef8c30d211bd8de3861063b0a2144cedeb2588 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Wed, 3 Sep 2025 16:16:55 +0200 Subject: [PATCH 07/19] refactor: Rename tasks --- cognee/api/v1/cognify/memify.py | 12 ++++++------ examples/python/memify_coding_agent_example.py | 4 ++-- .../python/memify_coding_agent_example_chunks.py | 4 ++-- 3 files changed, 10 insertions(+), 10 deletions(-) diff --git a/cognee/api/v1/cognify/memify.py b/cognee/api/v1/cognify/memify.py index 8237059ec..3c5f7be0f 100644 --- a/cognee/api/v1/cognify/memify.py +++ b/cognee/api/v1/cognify/memify.py @@ -23,9 +23,9 @@ logger = get_logger("memify") async def memify( - preprocessing_tasks: List[Task], - processing_tasks: List[Task] = [], - postprocessing_tasks: List[Task] = [], + data_streaming_tasks: List[Task], + data_processing_tasks: List[Task] = [], + data_persistence_tasks: List[Task] = [], data: Optional[Any] = None, datasets: Union[str, list[str], list[UUID]] = None, user: User = None, @@ -66,9 
+66,9 @@ async def memify( data = [memory_fragment] memify_tasks = [ - *preprocessing_tasks, # Unpack tasks provided to memify pipeline - *processing_tasks, - *postprocessing_tasks, + *data_streaming_tasks, # Unpack tasks provided to memify pipeline + *data_processing_tasks, + *data_persistence_tasks, ] await setup() diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py index 004a840f8..c0bda215a 100644 --- a/examples/python/memify_coding_agent_example.py +++ b/examples/python/memify_coding_agent_example.py @@ -62,8 +62,8 @@ async def main(): ] await memify( - preprocessing_tasks=subgraph_extraction_tasks, - processing_tasks=rule_association_tasks, + data_streaming_tasks=subgraph_extraction_tasks, + data_processing_tasks=rule_association_tasks, node_name=["coding_rules"], ) diff --git a/examples/python/memify_coding_agent_example_chunks.py b/examples/python/memify_coding_agent_example_chunks.py index b07bcb815..639b97396 100644 --- a/examples/python/memify_coding_agent_example_chunks.py +++ b/examples/python/memify_coding_agent_example_chunks.py @@ -80,8 +80,8 @@ async def main(): # Memify accepts these tasks and orchestrates forwarding of graph data through these tasks (if data is not specified). 
# If data is explicitely specified in the arguments this specified data will be forwarded through the tasks instead await memify( - preprocessing_tasks=subgraph_extraction_tasks, - processing_tasks=coding_rules_association_tasks, + data_streaming_tasks=subgraph_extraction_tasks, + data_processing_tasks=coding_rules_association_tasks, ) # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members) From 0e3a10d925fffdb769b1e31fedd35a4460715aa7 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Wed, 3 Sep 2025 17:49:33 +0200 Subject: [PATCH 08/19] refactor: Change input task names --- cognee/api/v1/cognify/memify.py | 15 +-- ...y_coding_rule_association_agent_system.txt | 6 - ...ify_coding_rule_association_agent_user.txt | 6 - .../python/memify_coding_agent_example.py | 66 +++++++---- .../memify_coding_agent_example_chunks.py | 106 ------------------ 5 files changed, 51 insertions(+), 148 deletions(-) delete mode 100644 cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt delete mode 100644 cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt delete mode 100644 examples/python/memify_coding_agent_example_chunks.py diff --git a/cognee/api/v1/cognify/memify.py b/cognee/api/v1/cognify/memify.py index 3c5f7be0f..86f84626a 100644 --- a/cognee/api/v1/cognify/memify.py +++ b/cognee/api/v1/cognify/memify.py @@ -1,5 +1,4 @@ from typing import Union, Optional, List, Type, Any -from dataclasses import field from uuid import UUID from cognee.shared.logging_utils import get_logger @@ -18,14 +17,17 @@ from cognee.modules.pipelines.layers.reset_dataset_pipeline_run_status import ( ) from cognee.modules.engine.operations.setup import setup from cognee.modules.pipelines.layers.pipeline_execution_mode import get_pipeline_executor +from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks +from cognee.tasks.codingagents.coding_rule_associations import 
( + add_rule_associations, +) logger = get_logger("memify") async def memify( - data_streaming_tasks: List[Task], - data_processing_tasks: List[Task] = [], - data_persistence_tasks: List[Task] = [], + extraction_tasks: List[Task] = [Task(extract_subgraph_chunks)], + enrichment_tasks: List[Task] = [Task(add_rule_associations)], data: Optional[Any] = None, datasets: Union[str, list[str], list[UUID]] = None, user: User = None, @@ -66,9 +68,8 @@ async def memify( data = [memory_fragment] memify_tasks = [ - *data_streaming_tasks, # Unpack tasks provided to memify pipeline - *data_processing_tasks, - *data_persistence_tasks, + *extraction_tasks, # Unpack tasks provided to memify pipeline + *enrichment_tasks, ] await setup() diff --git a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt deleted file mode 100644 index d9adf45f7..000000000 --- a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_system.txt +++ /dev/null @@ -1,6 +0,0 @@ -You are an association agent tasked with suggesting structured developer rules from user-agent interactions stored in a Knowledge Graph. -You will receive the actual user agent interaction as a set of relationships from a knowledge graph separated by \n---\n each represented as node1 -- relation -- node2 triplet, and the list of the already existing developer rules. -Each rule represents a single best practice or guideline the agent should follow in the future. -Suggest rules that are general and not specific to the knowledge graph relationships, strictly technical, add value and improve the future agent behavior. -Do not suggest rules similar to the existing ones or rules that are not general and dont add value. -It is acceptable to return an empty rule list. 
diff --git a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt b/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt deleted file mode 100644 index 9b525c625..000000000 --- a/cognee/infrastructure/llm/prompts/memify_coding_rule_association_agent_user.txt +++ /dev/null @@ -1,6 +0,0 @@ -**Here is the User-agent interaction context provided with a set of relationships from a knowledge graph separated by \n---\n each represented as node1 -- relation -- node2 triplet:** -`{{ chat }}` - - -**Already existing rules:** -`{{ rules }}` diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py index c0bda215a..61af467d3 100644 --- a/examples/python/memify_coding_agent_example.py +++ b/examples/python/memify_coding_agent_example.py @@ -7,8 +7,7 @@ from cognee.api.v1.visualize.visualize import visualize_graph from cognee.shared.logging_utils import setup_logging, ERROR from cognee.api.v1.cognify.memify import memify from cognee.modules.pipelines.tasks.task import Task -from cognee.tasks.memify.extract_subgraph import extract_subgraph -from cognee.modules.graph.utils import resolve_edges_to_text +from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks from cognee.tasks.codingagents.coding_rule_associations import ( add_rule_associations, get_existing_rules, @@ -26,54 +25,75 @@ async def main(): await cognee.prune.prune_data() await cognee.prune.prune_system(metadata=True) print("Data reset complete.\n") + print("Adding conversation about rules to cognee:\n") - # cognee knowledge graph will be created based on this text - text = """ - Natural language processing (NLP) is an interdisciplinary - subfield of computer science and information retrieval. - """ - - coding_rules_text = """ - Code must be formatted by PEP8 standards. + coding_rules_chat_from_principal_engineer = """ + We want code to be formatted by PEP8 standards. 
Typing and Docstrings must be added. + Please also make sure to write NOTE: on all more complex code segments. + If there is any duplicate code, try to handle it in one function to avoid code duplication. + Susan should also always review new code changes before merging to main. + New releases should not happen on Friday so we don't have to fix them during the weekend. """ + print( + f"Coding rules conversation with principal engineer: {coding_rules_chat_from_principal_engineer}" + ) + + coding_rules_chat_from_manager = """ + Susan should always review new code changes before merging to main. + New releases should not happen on Friday so we don't have to fix them during the weekend. + """ + print(f"Coding rules conversation with manager: {coding_rules_chat_from_manager}") - print("Adding text to cognee:") - print(text.strip()) # Add the text, and make it available for cognify - await cognee.add(text) - await cognee.add(coding_rules_text, node_set=["coding_rules"]) + await cognee.add([coding_rules_chat_from_principal_engineer, coding_rules_chat_from_manager]) print("Text added successfully.\n") # Use LLMs and cognee to create knowledge graph await cognee.cognify() print("Cognify process complete.\n") - subgraph_extraction_tasks = [Task(extract_subgraph)] + # Visualize graph after cognification + file_path = os.path.join( + pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_only_cognify.html" + ) + await visualize_graph(file_path) + print(f"Open file to see graph visualization only after cognification: {file_path}") - rule_association_tasks = [ - Task(resolve_edges_to_text, task_config={"batch_size": 10}), + # After graph is created, create a second pipeline that will go through the graph and enchance it with specific + # coding rule nodes + + # extract_subgraph_chunks is a function that returns all document chunks from specified subgraphs (if no subgraph is specifed the whole graph will be sent through memify) + subgraph_extraction_tasks = 
[Task(extract_subgraph_chunks)] + + # add_rule_associations is a function that handles processing coding rules from chunks and keeps track of + # existing rules so duplicate rules won't be created. As the result of this processing new Rule nodes will be created + # in the graph that specify coding rules found in conversations. + coding_rules_association_tasks = [ Task( add_rule_associations, rules_nodeset_name="coding_agent_rules", - user_prompt_location="memify_coding_rule_association_agent_user.txt", - system_prompt_location="memify_coding_rule_association_agent_system.txt", + task_config={"batch_size": 1}, ), ] + # Memify accepts these tasks and orchestrates forwarding of graph data through these tasks (if data is not specified). + # If data is explicitely specified in the arguments this specified data will be forwarded through the tasks instead await memify( - data_streaming_tasks=subgraph_extraction_tasks, - data_processing_tasks=rule_association_tasks, - node_name=["coding_rules"], + extraction_tasks=subgraph_extraction_tasks, + enrichment_tasks=coding_rules_association_tasks, ) + # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members) developer_rules = await get_existing_rules(rules_nodeset_name="coding_agent_rules") print(developer_rules) + # Visualize new graph with added memify context file_path = os.path.join( - pathlib.Path(__file__).parent, ".artifacts", "graph_visualization.html" + pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_after_memify.html" ) await visualize_graph(file_path) + print(f"Open file to see graph visualization after memify enhancment: {file_path}") if __name__ == "__main__": diff --git a/examples/python/memify_coding_agent_example_chunks.py b/examples/python/memify_coding_agent_example_chunks.py deleted file mode 100644 index 639b97396..000000000 --- a/examples/python/memify_coding_agent_example_chunks.py +++ /dev/null @@ -1,106 +0,0 @@ -import 
asyncio -import pathlib -import os - -import cognee -from cognee.api.v1.visualize.visualize import visualize_graph -from cognee.shared.logging_utils import setup_logging, ERROR -from cognee.api.v1.cognify.memify import memify -from cognee.modules.pipelines.tasks.task import Task -from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks -from cognee.tasks.codingagents.coding_rule_associations import ( - add_rule_associations, - get_existing_rules, -) - -# Prerequisites: -# 1. Copy `.env.template` and rename it to `.env`. -# 2. Add your OpenAI API key to the `.env` file in the `LLM_API_KEY` field: -# LLM_API_KEY = "your_key_here" - - -async def main(): - # Create a clean slate for cognee -- reset data and system state - print("Resetting cognee data...") - await cognee.prune.prune_data() - await cognee.prune.prune_system(metadata=True) - print("Data reset complete.\n") - print("Adding conversation about rules to cognee:\n") - - coding_rules_chat_from_principal_engineer = """ - We want code to be formatted by PEP8 standards. - Typing and Docstrings must be added. - Please also make sure to write NOTE: on all more complex code segments. - If there is any duplicate code, try to handle it in one function to avoid code duplication. - Susan should also always review new code changes before merging to main. - New releases should not happen on Friday so we don't have to fix them during the weekend. - """ - print( - f"Coding rules conversation with principal engineer: {coding_rules_chat_from_principal_engineer}" - ) - - coding_rules_chat_from_manager = """ - Susan should always review new code changes before merging to main. - New releases should not happen on Friday so we don't have to fix them during the weekend. 
- """ - print(f"Coding rules conversation with manager: {coding_rules_chat_from_manager}") - - # Add the text, and make it available for cognify - await cognee.add([coding_rules_chat_from_principal_engineer, coding_rules_chat_from_manager]) - print("Text added successfully.\n") - - # Use LLMs and cognee to create knowledge graph - await cognee.cognify() - print("Cognify process complete.\n") - - # Visualize graph after cognification - file_path = os.path.join( - pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_only_cognify.html" - ) - await visualize_graph(file_path) - print(f"Open file to see graph visualization only after cognification: {file_path}") - - # After graph is created, create a second pipeline that will go through the graph and enchance it with specific - # coding rule nodes - - # extract_subgraph_chunks is a function that returns all document chunks from specified subgraphs (if no subgraph is specifed the whole graph will be sent through memify) - subgraph_extraction_tasks = [Task(extract_subgraph_chunks)] - - # add_rule_associations is a function that handles processing coding rules from chunks and keeps track of - # existing rules so duplicate rules won't be created. As the result of this processing new Rule nodes will be created - # in the graph that specify coding rules found in conversations. - coding_rules_association_tasks = [ - Task( - add_rule_associations, - rules_nodeset_name="coding_agent_rules", - task_config={"batch_size": 1}, - ), - ] - - # Memify accepts these tasks and orchestrates forwarding of graph data through these tasks (if data is not specified). 
- # If data is explicitely specified in the arguments this specified data will be forwarded through the tasks instead - await memify( - data_streaming_tasks=subgraph_extraction_tasks, - data_processing_tasks=coding_rules_association_tasks, - ) - - # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members) - developer_rules = await get_existing_rules(rules_nodeset_name="coding_agent_rules") - print(developer_rules) - - # Visualize new graph with added memify context - file_path = os.path.join( - pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_after_memify.html" - ) - await visualize_graph(file_path) - print(f"Open file to see graph visualization after memify enhancment: {file_path}") - - -if __name__ == "__main__": - logger = setup_logging(log_level=ERROR) - loop = asyncio.new_event_loop() - asyncio.set_event_loop(loop) - try: - loop.run_until_complete(main()) - finally: - loop.run_until_complete(loop.shutdown_asyncgens()) From 3c50ef4d6f8e94a7c6edde0e00b66738705fe83a Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 14:44:13 +0200 Subject: [PATCH 09/19] docs: Update docstring for memify --- cognee/api/v1/cognify/memify.py | 29 +++++++++++++---------------- 1 file changed, 13 insertions(+), 16 deletions(-) diff --git a/cognee/api/v1/cognify/memify.py b/cognee/api/v1/cognify/memify.py index 86f84626a..dd089c060 100644 --- a/cognee/api/v1/cognify/memify.py +++ b/cognee/api/v1/cognify/memify.py @@ -33,24 +33,24 @@ async def memify( user: User = None, node_type: Optional[Type] = NodeSet, node_name: Optional[List[str]] = None, - cypher_query: Optional[str] = None, - vector_db_config: dict = None, - graph_db_config: dict = None, + vector_db_config: Optional[dict] = None, + graph_db_config: Optional[dict] = None, run_in_background: bool = False, ): """ - Prerequisites: - - **LLM_API_KEY**: Must be configured (required for entity extraction and graph generation) - - **Data 
Added**: Must have data previously added via `cognee.add()` and `cognee.cognify()` - - **Vector Database**: Must be accessible for embeddings storage - - **Graph Database**: Must be accessible for relationship storage - Args: - datasets: Dataset name(s) or dataset uuid to process. Processes all available data if None. + extraction_tasks: List of Cognee Tasks to execute for graph/data extraction. + enrichment_tasks: List of Cognee Tasks to handle enrichment of provided graph/data from extraction tasks. + data: The data to ingest. Can be anything when custom extraction and enrichment tasks are used. + Data provided here will be forwarded to the first extraction task in the pipeline as input. + If no data is provided the whole graph (or subgraph if node_name/node_type is specified) will be forwarded + datasets: Dataset name(s) or dataset uuid to process. Processes all available datasets if None. - Single dataset: "my_dataset" - Multiple datasets: ["docs", "research", "reports"] - None: Process all datasets for the user user: User context for authentication and data access. Uses default if None. + node_type: Filter graph to specific entity types (for advanced filtering). Used when no data is provided. + node_name: Filter graph to specific named entities (for targeted search). Used when no data is provided. vector_db_config: Custom vector database configuration for embeddings storage. graph_db_config: Custom graph database configuration for relationship storage. run_in_background: If True, starts processing asynchronously and returns immediately. 
@@ -60,12 +60,9 @@ async def memify( """ if not data: - if cypher_query: - pass - else: - memory_fragment = await get_memory_fragment(node_type=node_type, node_name=node_name) - # Subgraphs should be a single element in the list to represent one data item - data = [memory_fragment] + memory_fragment = await get_memory_fragment(node_type=node_type, node_name=node_name) + # Subgraphs should be a single element in the list to represent one data item + data = [memory_fragment] memify_tasks = [ *extraction_tasks, # Unpack tasks provided to memify pipeline From c924846b77c77d8b786c6055866112cbdd73fdc4 Mon Sep 17 00:00:00 2001 From: Hande <159312713+hande-k@users.noreply.github.com> Date: Thu, 4 Sep 2025 16:16:28 +0200 Subject: [PATCH 10/19] improve structure, readability --- cognee-starter-kit/src/pipelines/low_level.py | 291 +++++++++++++----- 1 file changed, 212 insertions(+), 79 deletions(-) diff --git a/cognee-starter-kit/src/pipelines/low_level.py b/cognee-starter-kit/src/pipelines/low_level.py index 8b4fccf33..80f4a22e9 100644 --- a/cognee-starter-kit/src/pipelines/low_level.py +++ b/cognee-starter-kit/src/pipelines/low_level.py @@ -1,8 +1,14 @@ -import os -import json +"""Cognee demo with simplified structure.""" + +from __future__ import annotations + import asyncio -import pathlib -from typing import List, Any +import json +import logging +from collections import defaultdict +from pathlib import Path +from typing import Any, Iterable, List, Mapping + from cognee import config, prune, search, SearchType, visualize_graph from cognee.low_level import setup, DataPoint from cognee.pipelines import run_tasks, Task @@ -13,120 +19,247 @@ from cognee.modules.data.methods import load_or_create_datasets class Person(DataPoint): + """Represent a person.""" + name: str metadata: dict = {"index_fields": ["name"]} class Department(DataPoint): + """Represent a department.""" + name: str employees: list[Person] metadata: dict = {"index_fields": ["name"]} class 
CompanyType(DataPoint): + """Represent a company type.""" + name: str = "Company" class Company(DataPoint): + """Represent a company.""" + name: str departments: list[Department] is_type: CompanyType metadata: dict = {"index_fields": ["name"]} -def ingest_files(data: List[Any]): +ROOT = Path(__file__).resolve().parent +DATA_DIR = ROOT.parent / "data" +COGNEE_DIR = ROOT / ".cognee_system" +ARTIFACTS_DIR = ROOT / ".artifacts" +GRAPH_HTML = ARTIFACTS_DIR / "graph_visualization.html" +COMPANIES_JSON = DATA_DIR / "companies.json" +PEOPLE_JSON = DATA_DIR / "people.json" + + +def load_json_file(path: Path) -> Any: + """Load a JSON file.""" + if not path.exists(): + raise FileNotFoundError(f"Missing required file: {path}") + return json.loads(path.read_text(encoding="utf-8")) + + +def remove_duplicates_preserve_order(seq: Iterable[Any]) -> list[Any]: + """Return list with duplicates removed while preserving order.""" + seen = set() + out = [] + for x in seq: + if x in seen: + continue + seen.add(x) + out.append(x) + return out + + +def collect_people(payloads: Iterable[Mapping[str, Any]]) -> list[Mapping[str, Any]]: + """Collect people from payloads.""" + people = [person for payload in payloads for person in payload.get("people", [])] + return people + + +def collect_companies(payloads: Iterable[Mapping[str, Any]]) -> list[Mapping[str, Any]]: + """Collect companies from payloads.""" + companies = [company for payload in payloads for company in payload.get("companies", [])] + return companies + + +def build_people_nodes(people: Iterable[Mapping[str, Any]]) -> dict: + """Build person nodes keyed by name.""" + nodes = {p["name"]: Person(name=p["name"]) for p in people if p.get("name")} + return nodes + + +def group_people_by_department(people: Iterable[Mapping[str, Any]]) -> dict: + """Group person names by department.""" + groups = defaultdict(list) + for person in people: + name = person.get("name") + if not name: + continue + dept = person.get("department", "Unknown") + 
groups[dept].append(name) + return groups + + +def collect_declared_departments( + groups: Mapping[str, list[str]], companies: Iterable[Mapping[str, Any]] +) -> set: + """Collect department names referenced anywhere.""" + names = set(groups) + for company in companies: + for dept in company.get("departments", []): + names.add(dept) + return names + + +def build_department_nodes(dept_names: Iterable[str]) -> dict: + """Build department nodes keyed by name.""" + nodes = {name: Department(name=name, employees=[]) for name in dept_names} + return nodes + + +def build_company_nodes(companies: Iterable[Mapping[str, Any]], company_type: CompanyType) -> dict: + """Build company nodes keyed by name.""" + nodes = { + c["name"]: Company(name=c["name"], departments=[], is_type=company_type) + for c in companies + if c.get("name") + } + return nodes + + +def iterate_company_department_pairs(companies: Iterable[Mapping[str, Any]]): + """Yield (company_name, department_name) pairs.""" + for company in companies: + comp_name = company.get("name") + if not comp_name: + continue + for dept in company.get("departments", []): + yield comp_name, dept + + +def attach_departments_to_companies( + companies: Iterable[Mapping[str, Any]], + dept_nodes: Mapping[str, Department], + company_nodes: Mapping[str, Company], +) -> None: + """Attach department nodes to companies.""" + for comp_name in company_nodes: + company_nodes[comp_name].departments = [] + for comp_name, dept_name in iterate_company_department_pairs(companies): + dept = dept_nodes.get(dept_name) + company = company_nodes.get(comp_name) + if not dept or not company: + continue + company.departments.append(dept) + + +def attach_employees_to_departments( + groups: Mapping[str, list[str]], + people_nodes: Mapping[str, Person], + dept_nodes: Mapping[str, Department], +) -> None: + """Attach employees to departments.""" + for dept in dept_nodes.values(): + dept.employees = [] + for dept_name, names in groups.items(): + unique_names = 
remove_duplicates_preserve_order(names) + target = dept_nodes.get(dept_name) + if not target: + continue + employees = [people_nodes[n] for n in unique_names if n in people_nodes] + target.employees = employees + + +def build_companies(payloads: Iterable[Mapping[str, Any]]) -> list[Company]: + """Build company nodes from payloads.""" + people = collect_people(payloads) + companies = collect_companies(payloads) + people_nodes = build_people_nodes(people) + groups = group_people_by_department(people) + dept_names = collect_declared_departments(groups, companies) + dept_nodes = build_department_nodes(dept_names) + company_type = CompanyType() + company_nodes = build_company_nodes(companies, company_type) + attach_departments_to_companies(companies, dept_nodes, company_nodes) + attach_employees_to_departments(groups, people_nodes, dept_nodes) + result = list(company_nodes.values()) + return result + + +def load_default_payload() -> list[Mapping[str, Any]]: + """Load the default payload from data files.""" + companies = load_json_file(COMPANIES_JSON) + people = load_json_file(PEOPLE_JSON) + payload = [{"companies": companies, "people": people}] + return payload + + +def ingest_payloads(data: List[Any] | None) -> list[Company]: + """Ingest payloads and build company nodes.""" if not data or data == [None]: - companies_file_path = os.path.join(os.path.dirname(__file__), "../data/companies.json") - companies = json.loads(open(companies_file_path, "r").read()) - - people_file_path = os.path.join(os.path.dirname(__file__), "../data/people.json") - people = json.loads(open(people_file_path, "r").read()) - - data = [{"companies": companies, "people": people}] - - people_data_points = {} - departments_data_points = {} - companies_data_points = {} - - for data_item in data: - people = data_item["people"] - companies = data_item["companies"] - - for person in people: - new_person = Person(name=person["name"]) - people_data_points[person["name"]] = new_person - - if 
person["department"] not in departments_data_points: - departments_data_points[person["department"]] = Department( - name=person["department"], employees=[new_person] - ) - else: - departments_data_points[person["department"]].employees.append(new_person) - - # Create a single CompanyType node, so we connect all companies to it. - companyType = CompanyType() - - for company in companies: - new_company = Company(name=company["name"], departments=[], is_type=companyType) - companies_data_points[company["name"]] = new_company - - for department_name in company["departments"]: - if department_name not in departments_data_points: - departments_data_points[department_name] = Department( - name=department_name, employees=[] - ) - - new_company.departments.append(departments_data_points[department_name]) - - return list(companies_data_points.values()) + data = load_default_payload() + companies = build_companies(data) + return companies -async def main(): - cognee_directory_path = str( - pathlib.Path(os.path.join(pathlib.Path(__file__).parent, ".cognee_system")).resolve() - ) - # Set up the Cognee system directory. Cognee will store system files and databases here. - config.system_root_directory(cognee_directory_path) +async def execute_pipeline() -> None: + """Execute Cognee pipeline.""" - # Prune system metadata before running, only if we want "fresh" state. 
+ # Configure system paths + logging.info("Configuring Cognee directories at %s", COGNEE_DIR) + config.system_root_directory(str(COGNEE_DIR)) + ARTIFACTS_DIR.mkdir(parents=True, exist_ok=True) + + # Reset state and initialize await prune.prune_system(metadata=True) - await setup() - # Get default user + # Get user and dataset user = await get_default_user() - datasets = await load_or_create_datasets(["demo_dataset"], [], user) + dataset_id = datasets[0].id - pipeline = run_tasks( - [ - Task(ingest_files), - Task(add_data_points), - ], - datasets[0].id, - None, - user, - "demo_pipeline", - ) - + # Build and run pipeline + tasks = [Task(ingest_payloads), Task(add_data_points)] + pipeline = run_tasks(tasks, dataset_id, None, user, "demo_pipeline") async for status in pipeline: - print(status) + logging.info("Pipeline status: %s", status) + # Post-process: index graph edges and visualize await index_graph_edges() + await visualize_graph(str(GRAPH_HTML)) - # Or use our simple graph preview - graph_file_path = str( - os.path.join(os.path.dirname(__file__), ".artifacts/graph_visualization.html") - ) - await visualize_graph(graph_file_path) - - # Completion query that uses graph data to form context. 
+ # Run query against graph completion = await search( query_text="Who works for GreenFuture Solutions?", query_type=SearchType.GRAPH_COMPLETION, ) - print("Graph completion result is:") - print(completion) + result = completion + logging.info("Graph completion result: %s", result) + + +def configure_logging() -> None: + """Configure logging.""" + logging.basicConfig( + level=logging.INFO, + format="%(asctime)s | %(levelname)s | %(message)s", + ) + + +async def main() -> None: + """Run main function.""" + configure_logging() + try: + await execute_pipeline() + except Exception: + logging.exception("Run failed") + raise if __name__ == "__main__": From c1106b76fe140f9ed4588a50ff3914e4ef2a2778 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 17:53:07 +0200 Subject: [PATCH 11/19] feat: Added new coding rules search --- .../retrieval/coding_rules_retriever.py | 19 +++++++++++++++++++ cognee/modules/search/methods/search.py | 4 ++++ cognee/modules/search/types/SearchType.py | 1 + .../codingagents/coding_rule_associations.py | 5 +++-- .../python/memify_coding_agent_example.py | 9 +++++++-- 5 files changed, 34 insertions(+), 4 deletions(-) create mode 100644 cognee/modules/retrieval/coding_rules_retriever.py diff --git a/cognee/modules/retrieval/coding_rules_retriever.py b/cognee/modules/retrieval/coding_rules_retriever.py new file mode 100644 index 000000000..2578d1ee1 --- /dev/null +++ b/cognee/modules/retrieval/coding_rules_retriever.py @@ -0,0 +1,19 @@ +from cognee.shared.logging_utils import get_logger +from cognee.tasks.codingagents.coding_rule_associations import get_existing_rules + +logger = get_logger("CodingRulesRetriever") + + +class CodingRulesRetriever: + """Retriever for handling codeing rule based searches.""" + + def __init__(self, rules_nodeset_name): + if isinstance(rules_nodeset_name, list): + rules_nodeset_name = rules_nodeset_name[0] + self.rules_nodeset_name = rules_nodeset_name + """Initialize retriever with search parameters.""" + + 
async def get_existing_rules(self, query_text): + return await get_existing_rules( + rules_nodeset_name=self.rules_nodeset_name, return_list=True + ) diff --git a/cognee/modules/search/methods/search.py b/cognee/modules/search/methods/search.py index 71bf61d6b..b341e4a8a 100644 --- a/cognee/modules/search/methods/search.py +++ b/cognee/modules/search/methods/search.py @@ -13,6 +13,7 @@ from cognee.modules.retrieval.insights_retriever import InsightsRetriever from cognee.modules.retrieval.summaries_retriever import SummariesRetriever from cognee.modules.retrieval.completion_retriever import CompletionRetriever from cognee.modules.retrieval.graph_completion_retriever import GraphCompletionRetriever +from cognee.modules.retrieval.coding_rules_retriever import CodingRulesRetriever from cognee.modules.retrieval.graph_summary_completion_retriever import ( GraphSummaryCompletionRetriever, ) @@ -167,6 +168,9 @@ async def specific_search( SearchType.CYPHER: CypherSearchRetriever().get_completion, SearchType.NATURAL_LANGUAGE: NaturalLanguageRetriever().get_completion, SearchType.FEEDBACK: UserQAFeedback(last_k=last_k).add_feedback, + SearchType.CODING_RULES: CodingRulesRetriever( + rules_nodeset_name=node_name + ).get_existing_rules, } # If the query type is FEELING_LUCKY, select the search type intelligently diff --git a/cognee/modules/search/types/SearchType.py b/cognee/modules/search/types/SearchType.py index c1f0521b2..0a7cae63a 100644 --- a/cognee/modules/search/types/SearchType.py +++ b/cognee/modules/search/types/SearchType.py @@ -15,3 +15,4 @@ class SearchType(Enum): GRAPH_COMPLETION_CONTEXT_EXTENSION = "GRAPH_COMPLETION_CONTEXT_EXTENSION" FEELING_LUCKY = "FEELING_LUCKY" FEEDBACK = "FEEDBACK" + CODING_RULES = "CODING_RULES" diff --git a/cognee/tasks/codingagents/coding_rule_associations.py b/cognee/tasks/codingagents/coding_rule_associations.py index e722e7728..c809bc68f 100644 --- a/cognee/tasks/codingagents/coding_rule_associations.py +++ 
b/cognee/tasks/codingagents/coding_rule_associations.py @@ -31,7 +31,7 @@ class RuleSet(DataPoint): ) -async def get_existing_rules(rules_nodeset_name: str) -> str: +async def get_existing_rules(rules_nodeset_name: str, return_list: bool = False) -> str: graph_engine = await get_graph_engine() nodes_data, _ = await graph_engine.get_nodeset_subgraph( node_type=NodeSet, node_name=[rules_nodeset_name] @@ -46,7 +46,8 @@ async def get_existing_rules(rules_nodeset_name: str) -> str: and "text" in item[1] ] - existing_rules = "\n".join(f"- {rule}" for rule in existing_rules) + if not return_list: + existing_rules = "\n".join(f"- {rule}" for rule in existing_rules) return existing_rules diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py index 61af467d3..7f8c58802 100644 --- a/examples/python/memify_coding_agent_example.py +++ b/examples/python/memify_coding_agent_example.py @@ -85,8 +85,13 @@ async def main(): ) # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members) - developer_rules = await get_existing_rules(rules_nodeset_name="coding_agent_rules") - print(developer_rules) + print( + await cognee.search( + query_text="List me the coding rules", + query_type=cognee.SearchType.CODING_RULES, + node_name=["coding_agent_rules"], + ) + ) # Visualize new graph with added memify context file_path = os.path.join( From 95bafd942c8b0553f45a7987492ac8cbf6e5ad86 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 18:06:02 +0200 Subject: [PATCH 12/19] feat: add coding rule search type --- examples/python/memify_coding_agent_example.py | 13 +++++++------ 1 file changed, 7 insertions(+), 6 deletions(-) diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py index 7f8c58802..0238cf775 100644 --- a/examples/python/memify_coding_agent_example.py +++ b/examples/python/memify_coding_agent_example.py @@ 
-85,14 +85,15 @@ async def main(): ) # Find the new specific coding rules added to graph through memify (created based on chat conversation between team members) - print( - await cognee.search( - query_text="List me the coding rules", - query_type=cognee.SearchType.CODING_RULES, - node_name=["coding_agent_rules"], - ) + coding_rules = await cognee.search( + query_text="List me the coding rules", + query_type=cognee.SearchType.CODING_RULES, + node_name=["coding_agent_rules"], ) + for coding_rule in coding_rules: + print(coding_rule) + # Visualize new graph with added memify context file_path = os.path.join( pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_after_memify.html" ) await visualize_graph(file_path) From b0d4503f3252e1d8c56ec98644d72c219abb31 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 18:12:59 +0200 Subject: [PATCH 13/19] refactor: Move memify out of api folder --- cognee/__init__.py | 1 + cognee/modules/memify/__init__.py | 1 + cognee/{api/v1/cognify => modules/memify}/memify.py | 0 examples/python/memify_coding_agent_example.py | 7 ++----- 4 files changed, 4 insertions(+), 5 deletions(-) create mode 100644 cognee/modules/memify/__init__.py rename cognee/{api/v1/cognify => modules/memify}/memify.py (100%) diff --git a/cognee/api/v1/cognify/memify.py b/cognee/modules/memify/memify.py similarity index 100% 
rename from cognee/api/v1/cognify/memify.py rename to cognee/modules/memify/memify.py diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py index 0238cf775..17bf8fc0e 100644 --- a/examples/python/memify_coding_agent_example.py +++ b/examples/python/memify_coding_agent_example.py @@ -3,15 +3,12 @@ import pathlib import os import cognee +from cognee import memify from cognee.api.v1.visualize.visualize import visualize_graph from cognee.shared.logging_utils import setup_logging, ERROR -from cognee.api.v1.cognify.memify import memify from cognee.modules.pipelines.tasks.task import Task from cognee.tasks.memify.extract_subgraph_chunks import extract_subgraph_chunks -from cognee.tasks.codingagents.coding_rule_associations import ( - add_rule_associations, - get_existing_rules, -) +from cognee.tasks.codingagents.coding_rule_associations import add_rule_associations # Prerequisites: # 1. Copy `.env.template` and rename it to `.env`. From 805f443cd6e88e6a9ae68f3ddaa2594982488c65 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 19:08:55 +0200 Subject: [PATCH 14/19] feat: Add memify router --- cognee/api/client.py | 3 + cognee/api/v1/add/routers/get_add_router.py | 6 -- cognee/api/v1/memify/__init__.py | 0 cognee/api/v1/memify/routers/__init__.py | 1 + .../v1/memify/routers/get_memify_router.py | 99 +++++++++++++++++++ cognee/modules/memify/memify.py | 13 ++- .../python/memify_coding_agent_example.py | 7 +- 7 files changed, 118 insertions(+), 11 deletions(-) create mode 100644 cognee/api/v1/memify/__init__.py create mode 100644 cognee/api/v1/memify/routers/__init__.py create mode 100644 cognee/api/v1/memify/routers/get_memify_router.py diff --git a/cognee/api/client.py b/cognee/api/client.py index 215e4a17e..d6bd71d5f 100644 --- a/cognee/api/client.py +++ b/cognee/api/client.py @@ -22,6 +22,7 @@ from cognee.api.v1.settings.routers import get_settings_router from cognee.api.v1.datasets.routers import 
get_datasets_router from cognee.api.v1.cognify.routers import get_code_pipeline_router, get_cognify_router from cognee.api.v1.search.routers import get_search_router +from cognee.api.v1.memify.routers import get_memify_router from cognee.api.v1.add.routers import get_add_router from cognee.api.v1.delete.routers import get_delete_router from cognee.api.v1.responses.routers import get_responses_router @@ -230,6 +231,8 @@ app.include_router(get_add_router(), prefix="/api/v1/add", tags=["add"]) app.include_router(get_cognify_router(), prefix="/api/v1/cognify", tags=["cognify"]) +app.include_router(get_memify_router(), prefix="/api/v1/memify", tags=["memify"]) + app.include_router(get_search_router(), prefix="/api/v1/search", tags=["search"]) app.include_router( diff --git a/cognee/api/v1/add/routers/get_add_router.py b/cognee/api/v1/add/routers/get_add_router.py index 1703d9931..9de818b7d 100644 --- a/cognee/api/v1/add/routers/get_add_router.py +++ b/cognee/api/v1/add/routers/get_add_router.py @@ -1,6 +1,3 @@ -import os -import requests -import subprocess from uuid import UUID from fastapi import APIRouter @@ -60,9 +57,6 @@ def get_add_router() -> APIRouter: ## Notes - To add data to datasets not owned by the user, use dataset_id (when ENABLE_BACKEND_ACCESS_CONTROL is set to True) - - GitHub repositories are cloned and all files are processed - - HTTP URLs are fetched and their content is processed - - The ALLOW_HTTP_REQUESTS environment variable controls URL processing - datasetId value can only be the UUID of an already existing dataset """ send_telemetry( diff --git a/cognee/api/v1/memify/__init__.py b/cognee/api/v1/memify/__init__.py new file mode 100644 index 000000000..e69de29bb diff --git a/cognee/api/v1/memify/routers/__init__.py b/cognee/api/v1/memify/routers/__init__.py new file mode 100644 index 000000000..1d1793c35 --- /dev/null +++ b/cognee/api/v1/memify/routers/__init__.py @@ -0,0 +1 @@ +from .get_memify_router import get_memify_router diff --git 
a/cognee/api/v1/memify/routers/get_memify_router.py b/cognee/api/v1/memify/routers/get_memify_router.py new file mode 100644 index 000000000..edac2775a --- /dev/null +++ b/cognee/api/v1/memify/routers/get_memify_router.py @@ -0,0 +1,99 @@ +from uuid import UUID + +from fastapi import APIRouter +from fastapi.responses import JSONResponse +from fastapi import Depends +from pydantic import Field +from typing import List, Optional + +from cognee.api.DTO import InDTO +from cognee.modules.users.models import User +from cognee.modules.users.methods import get_authenticated_user +from cognee.shared.utils import send_telemetry +from cognee.modules.pipelines.models import PipelineRunErrored +from cognee.shared.logging_utils import get_logger + +logger = get_logger() + + +class MemifyPayloadDTO(InDTO): + extraction_tasks: List[str] = Field( + default=None, + examples=[[]], + ) + enrichment_tasks: List[str] = (Field(default=None, examples=[[]]),) + data: Optional[str] = (Field(default=None),) + dataset_names: Optional[List[str]] = Field(default=None) + dataset_ids: Optional[List[UUID]] = Field(default=None, examples=[[]]) + node_name: Optional[List[str]] = Field(default=None) + run_in_background: Optional[bool] = Field(default=False) + + +def get_memify_router() -> APIRouter: + router = APIRouter() + + @router.post("", response_model=dict) + async def memify(payload: MemifyPayloadDTO, user: User = Depends(get_authenticated_user)): + """ + Enrichment pipeline in Cognee, can work with already built graphs. If no data is provided existing knowledge graph will be used as data, + custom data can also be provided instead which can be processed with provided extraction and enrichment tasks. + + Provided tasks and data will be arranged to run the Cognee pipeline and execute graph enrichment/creation. + + ## Request Parameters + - **extractionTasks** Optional[List[str]]: List of available Cognee Tasks to execute for graph/data extraction. 
+ - **enrichmentTasks** Optional[List[str]]: List of available Cognee Tasks to handle enrichment of provided graph/data from extraction tasks. + - **data** Optional[List[str]]: The data to ingest. Can be any text data when custom extraction and enrichment tasks are used. + Data provided here will be forwarded to the first extraction task in the pipeline as input. + If no data is provided the whole graph (or subgraph if node_name/node_type is specified) will be forwarded + - **dataset_names** (Optional[List[str]]): Name of the datasets to memify + - **dataset_ids** (Optional[List[UUID]]): List of UUIDs of an already existing dataset + - **node_name** (Optional[List[str]]): Filter graph to specific named entities (for targeted search). Used when no data is provided. + - **run_in_background** (Optional[bool]): Whether to execute processing asynchronously. Defaults to False (blocking). + + Either datasetName or datasetId must be provided. + + ## Response + Returns information about the memify operation containing: + - Status of the operation + - Details about the processed data + - Any relevant metadata from the ingestion process + + ## Error Codes + - **400 Bad Request**: Neither datasetId nor datasetName provided + - **409 Conflict**: Error during memify operation + - **403 Forbidden**: User doesn't have permission to use dataset + + ## Notes + - To memify datasets not owned by the user, use dataset_id (when ENABLE_BACKEND_ACCESS_CONTROL is set to True) + - datasetId value can only be the UUID of an already existing dataset + """ + + send_telemetry( + "Memify API Endpoint Invoked", + user.id, + additional_properties={"endpoint": "POST /v1/memify"}, + ) + + if not payload.dataset_ids and not payload.dataset_names: + raise ValueError("Either datasetId or datasetName must be provided.") + + from cognee import memify + + try: + memify_run = await memify( + extraction_tasks=payload.extraction_tasks, + enrichment_tasks=payload.enrichment_tasks, + data=payload.data, + 
datasets=payload.dataset_ids if payload.dataset_ids else payload.dataset_names, + node_name=payload.node_name, + user=user, + ) + + if isinstance(memify_run, PipelineRunErrored): + return JSONResponse(status_code=420, content=memify_run) + return memify_run + except Exception as error: + return JSONResponse(status_code=409, content={"error": str(error)}) + + return router diff --git a/cognee/modules/memify/memify.py b/cognee/modules/memify/memify.py index dd089c060..80afd7325 100644 --- a/cognee/modules/memify/memify.py +++ b/cognee/modules/memify/memify.py @@ -26,8 +26,8 @@ logger = get_logger("memify") async def memify( - extraction_tasks: List[Task] = [Task(extract_subgraph_chunks)], - enrichment_tasks: List[Task] = [Task(add_rule_associations)], + extraction_tasks: Union[List[Task], List[str]] = [Task(extract_subgraph_chunks)], + enrichment_tasks: Union[List[Task], List[str]] = [Task(add_rule_associations)], data: Optional[Any] = None, datasets: Union[str, list[str], list[UUID]] = None, user: User = None, @@ -38,6 +38,15 @@ async def memify( run_in_background: bool = False, ): """ + Enrichment pipeline in Cognee, can work with already built graphs. If no data is provided existing knowledge graph will be used as data, + custom data can also be provided instead which can be processed with provided extraction and enrichment tasks. + + Provided tasks and data will be arranged to run the Cognee pipeline and execute graph enrichment/creation. + + This is the core processing step in Cognee that converts raw text and documents + into an intelligent knowledge graph. It analyzes content, extracts entities and + relationships, and creates semantic connections for enhanced search and reasoning. + Args: extraction_tasks: List of Cognee Tasks to execute for graph/data extraction. enrichment_tasks: List of Cognee Tasks to handle enrichment of provided graph/data from extraction tasks. 
diff --git a/examples/python/memify_coding_agent_example.py b/examples/python/memify_coding_agent_example.py index 17bf8fc0e..1fd3b1528 100644 --- a/examples/python/memify_coding_agent_example.py +++ b/examples/python/memify_coding_agent_example.py @@ -55,7 +55,7 @@ async def main(): pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_only_cognify.html" ) await visualize_graph(file_path) - print(f"Open file to see graph visualization only after cognification: {file_path}") + print(f"Open file to see graph visualization only after cognification: {file_path}\n") # After graph is created, create a second pipeline that will go through the graph and enchance it with specific # coding rule nodes @@ -88,15 +88,16 @@ async def main(): node_name=["coding_agent_rules"], ) + print("Coding rules created by memify:") for coding_rule in coding_rules: - print(coding_rule) + print("- " + coding_rule) # Visualize new graph with added memify context file_path = os.path.join( pathlib.Path(__file__).parent, ".artifacts", "graph_visualization_after_memify.html" ) await visualize_graph(file_path) - print(f"Open file to see graph visualization after memify enhancment: {file_path}") + print(f"\nOpen file to see graph visualization after memify enhancement: {file_path}") if __name__ == "__main__": From e06cf11f49d2a574e0906d32dd022767a2d7cdd9 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 19:53:59 +0200 Subject: [PATCH 15/19] fix: Resolve import issue with creating auth dataset --- cognee/api/v1/add/routers/get_add_router.py | 2 +- .../api/v1/memify/routers/get_memify_router.py | 16 ++++++++-------- .../data/methods/load_or_create_datasets.py | 2 +- cognee/modules/memify/memify.py | 16 ++++++++++++++-- .../modules/retrieval/coding_rules_retriever.py | 5 ++++- 5 files changed, 28 insertions(+), 13 deletions(-) diff --git a/cognee/api/v1/add/routers/get_add_router.py b/cognee/api/v1/add/routers/get_add_router.py index 9de818b7d..f27d559e1 100644 --- 
a/cognee/api/v1/add/routers/get_add_router.py +++ b/cognee/api/v1/add/routers/get_add_router.py @@ -21,7 +21,7 @@ def get_add_router() -> APIRouter: async def add( data: List[UploadFile] = File(default=None), datasetName: Optional[str] = Form(default=None), - datasetId: Union[UUID, Literal[""], None] = Form(default=None, examples=[""]), + datasetId: Union[UUID, None] = Form(default=None, examples=[""]), node_set: Optional[List[str]] = Form(default=[""], example=[""]), user: User = Depends(get_authenticated_user), ): diff --git a/cognee/api/v1/memify/routers/get_memify_router.py b/cognee/api/v1/memify/routers/get_memify_router.py index edac2775a..817eef9bd 100644 --- a/cognee/api/v1/memify/routers/get_memify_router.py +++ b/cognee/api/v1/memify/routers/get_memify_router.py @@ -17,15 +17,15 @@ logger = get_logger() class MemifyPayloadDTO(InDTO): - extraction_tasks: List[str] = Field( + extraction_tasks: Optional[List[str]] = Field( default=None, examples=[[]], ) - enrichment_tasks: List[str] = (Field(default=None, examples=[[]]),) - data: Optional[str] = (Field(default=None),) - dataset_names: Optional[List[str]] = Field(default=None) + enrichment_tasks: Optional[List[str]] = Field(default=None, examples=[[]]) + data: Optional[str] = Field(default="") + dataset_names: Optional[List[str]] = Field(default=None, examples=[[]]) dataset_ids: Optional[List[UUID]] = Field(default=None, examples=[[]]) - node_name: Optional[List[str]] = Field(default=None) + node_name: Optional[List[str]] = Field(default=None, examples=[[]]) run_in_background: Optional[bool] = Field(default=False) @@ -78,10 +78,10 @@ def get_memify_router() -> APIRouter: if not payload.dataset_ids and not payload.dataset_names: raise ValueError("Either datasetId or datasetName must be provided.") - from cognee import memify - try: - memify_run = await memify( + from cognee.modules.memify import memify as cognee_memify + + memify_run = await cognee_memify( extraction_tasks=payload.extraction_tasks, 
enrichment_tasks=payload.enrichment_tasks, data=payload.data, diff --git a/cognee/modules/data/methods/load_or_create_datasets.py b/cognee/modules/data/methods/load_or_create_datasets.py index 1d6ef3efb..2c9a6497c 100644 --- a/cognee/modules/data/methods/load_or_create_datasets.py +++ b/cognee/modules/data/methods/load_or_create_datasets.py @@ -2,7 +2,7 @@ from typing import List, Union from uuid import UUID from cognee.modules.data.models import Dataset -from cognee.modules.data.methods import create_authorized_dataset +from cognee.modules.data.methods.create_authorized_dataset import create_authorized_dataset from cognee.modules.data.exceptions import DatasetNotFoundError diff --git a/cognee/modules/memify/memify.py b/cognee/modules/memify/memify.py index 80afd7325..d8e1087f2 100644 --- a/cognee/modules/memify/memify.py +++ b/cognee/modules/memify/memify.py @@ -26,8 +26,8 @@ logger = get_logger("memify") async def memify( - extraction_tasks: Union[List[Task], List[str]] = [Task(extract_subgraph_chunks)], - enrichment_tasks: Union[List[Task], List[str]] = [Task(add_rule_associations)], + extraction_tasks: Union[List[Task], List[str]] = None, + enrichment_tasks: Union[List[Task], List[str]] = None, data: Optional[Any] = None, datasets: Union[str, list[str], list[UUID]] = None, user: User = None, @@ -68,6 +68,18 @@ async def memify( Use pipeline_run_id from return value to monitor progress. 
""" + # Use default coding rules tasks if no tasks were provided + if not extraction_tasks: + extraction_tasks = [Task(extract_subgraph_chunks)] + if not enrichment_tasks: + enrichment_tasks = [ + Task( + add_rule_associations, + rules_nodeset_name="coding_agent_rules", + task_config={"batch_size": 1}, + ) + ] + if not data: memory_fragment = await get_memory_fragment(node_type=node_type, node_name=node_name) # Subgraphs should be a single element in the list to represent one data item diff --git a/cognee/modules/retrieval/coding_rules_retriever.py b/cognee/modules/retrieval/coding_rules_retriever.py index 2578d1ee1..364ff3236 100644 --- a/cognee/modules/retrieval/coding_rules_retriever.py +++ b/cognee/modules/retrieval/coding_rules_retriever.py @@ -7,8 +7,11 @@ logger = get_logger("CodingRulesRetriever") class CodingRulesRetriever: """Retriever for handling codeing rule based searches.""" - def __init__(self, rules_nodeset_name): + def __init__(self, rules_nodeset_name="coding_agent_rules"): if isinstance(rules_nodeset_name, list): + if not rules_nodeset_name: + # If there is no provided nodeset set to coding_agent_rules + rules_nodeset_name = ["coding_agent_rules"] rules_nodeset_name = rules_nodeset_name[0] self.rules_nodeset_name = rules_nodeset_name """Initialize retriever with search parameters.""" From 9e201035493e6a38d614db9cbbd87b7d69a926d6 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 20:59:00 +0200 Subject: [PATCH 16/19] feat: Enable multi-user mode to work with memify --- .../v1/memify/routers/get_memify_router.py | 12 +++---- .../modules/graph/cognee_graph/CogneeGraph.py | 2 +- cognee/modules/memify/memify.py | 32 ++++++++++--------- 3 files changed, 24 insertions(+), 22 deletions(-) diff --git a/cognee/api/v1/memify/routers/get_memify_router.py b/cognee/api/v1/memify/routers/get_memify_router.py index 817eef9bd..cf1df8f71 100644 --- a/cognee/api/v1/memify/routers/get_memify_router.py +++ 
b/cognee/api/v1/memify/routers/get_memify_router.py @@ -23,8 +23,8 @@ class MemifyPayloadDTO(InDTO): ) enrichment_tasks: Optional[List[str]] = Field(default=None, examples=[[]]) data: Optional[str] = Field(default="") - dataset_names: Optional[List[str]] = Field(default=None, examples=[[]]) - dataset_ids: Optional[List[UUID]] = Field(default=None, examples=[[]]) + dataset_name: Optional[str] = Field(default=None) + dataset_id: Optional[UUID] = Field(default=None, examples=[[""]]) node_name: Optional[List[str]] = Field(default=None, examples=[[]]) run_in_background: Optional[bool] = Field(default=False) @@ -46,8 +46,8 @@ def get_memify_router() -> APIRouter: - **data** Optional[List[str]]: The data to ingest. Can be any text data when custom extraction and enrichment tasks are used. Data provided here will be forwarded to the first extraction task in the pipeline as input. If no data is provided the whole graph (or subgraph if node_name/node_type is specified) will be forwarded - - **dataset_names** (Optional[List[str]]): Name of the datasets to memify - - **dataset_ids** (Optional[List[UUID]]): List of UUIDs of an already existing dataset + - **dataset_name** (Optional[str]): Name of the dataset to memify + - **dataset_id** (Optional[UUID]): UUID of an already existing dataset - **node_name** (Optional[List[str]]): Filter graph to specific named entities (for targeted search). Used when no data is provided. - **run_in_background** (Optional[bool]): Whether to execute processing asynchronously. Defaults to False (blocking). 
@@ -75,7 +75,7 @@ def get_memify_router() -> APIRouter: additional_properties={"endpoint": "POST /v1/memify"}, ) - if not payload.dataset_ids and not payload.dataset_names: + if not payload.dataset_id and not payload.dataset_name: raise ValueError("Either datasetId or datasetName must be provided.") try: @@ -85,7 +85,7 @@ def get_memify_router() -> APIRouter: extraction_tasks=payload.extraction_tasks, enrichment_tasks=payload.enrichment_tasks, data=payload.data, - datasets=payload.dataset_ids if payload.dataset_ids else payload.dataset_names, + dataset=payload.dataset_id if payload.dataset_id else payload.dataset_name, node_name=payload.node_name, user=user, ) diff --git a/cognee/modules/graph/cognee_graph/CogneeGraph.py b/cognee/modules/graph/cognee_graph/CogneeGraph.py index 924532ce0..acfe04de7 100644 --- a/cognee/modules/graph/cognee_graph/CogneeGraph.py +++ b/cognee/modules/graph/cognee_graph/CogneeGraph.py @@ -76,7 +76,7 @@ class CogneeGraph(CogneeAbstractGraph): start_time = time.time() # Determine projection strategy - if node_type is not None and node_name not in [None, []]: + if node_type is not None and node_name not in [None, [], ""]: nodes_data, edges_data = await adapter.get_nodeset_subgraph( node_type=node_type, node_name=node_name ) diff --git a/cognee/modules/memify/memify.py b/cognee/modules/memify/memify.py index d8e1087f2..2d9b32a1b 100644 --- a/cognee/modules/memify/memify.py +++ b/cognee/modules/memify/memify.py @@ -4,7 +4,7 @@ from uuid import UUID from cognee.shared.logging_utils import get_logger from cognee.modules.retrieval.utils.brute_force_triplet_search import get_memory_fragment - +from cognee.context_global_variables import set_database_global_context_variables from cognee.modules.engine.models.node_set import NodeSet from cognee.modules.pipelines import run_pipeline from cognee.modules.pipelines.tasks.task import Task @@ -29,7 +29,7 @@ async def memify( extraction_tasks: Union[List[Task], List[str]] = None, enrichment_tasks: 
Union[List[Task], List[str]] = None, data: Optional[Any] = None, - datasets: Union[str, list[str], list[UUID]] = None, + dataset: Union[str, UUID] = "main_dataset", user: User = None, node_type: Optional[Type] = NodeSet, node_name: Optional[List[str]] = None, @@ -53,10 +53,7 @@ async def memify( data: The data to ingest. Can be anything when custom extraction and enrichment tasks are used. Data provided here will be forwarded to the first extraction task in the pipeline as input. If no data is provided the whole graph (or subgraph if node_name/node_type is specified) will be forwarded - datasets: Dataset name(s) or dataset uuid to process. Processes all available datasets if None. - - Single dataset: "my_dataset" - - Multiple datasets: ["docs", "research", "reports"] - - None: Process all datasets for the user + dataset: Dataset name or dataset uuid to process. user: User context for authentication and data access. Uses default if None. node_type: Filter graph to specific entity types (for advanced filtering). Used when no data is provided. node_name: Filter graph to specific named entities (for targeted search). Used when no data is provided. 
@@ -80,7 +77,17 @@ async def memify( ) ] + await setup() + + user, authorized_dataset_list = await resolve_authorized_user_datasets(dataset, user) + authorized_dataset = authorized_dataset_list[0] + if not data: + # Will only be used if ENABLE_BACKEND_ACCESS_CONTROL is set to True + await set_database_global_context_variables( + authorized_dataset.id, authorized_dataset.owner_id + ) + memory_fragment = await get_memory_fragment(node_type=node_type, node_name=node_name) # Subgraphs should be a single element in the list to represent one data item data = [memory_fragment] @@ -90,14 +97,9 @@ async def memify( *enrichment_tasks, ] - await setup() - - user, authorized_datasets = await resolve_authorized_user_datasets(datasets, user) - - for dataset in authorized_datasets: - await reset_dataset_pipeline_run_status( - dataset.id, user, pipeline_names=["memify_pipeline"] - ) + await reset_dataset_pipeline_run_status( + authorized_dataset.id, user, pipeline_names=["memify_pipeline"] + ) # By calling get pipeline executor we get a function that will have the run_pipeline run in the background or a function that we will need to wait for pipeline_executor_func = get_pipeline_executor(run_in_background=run_in_background) @@ -108,7 +110,7 @@ async def memify( tasks=memify_tasks, user=user, data=data, - datasets=datasets, + datasets=authorized_dataset.id, vector_db_config=vector_db_config, graph_db_config=graph_db_config, incremental_loading=False, From 0c7ba7c23610cf966c5660b9ad8d6f5f054dc573 Mon Sep 17 00:00:00 2001 From: Igor Ilic Date: Thu, 4 Sep 2025 21:05:24 +0200 Subject: [PATCH 17/19] refactor: Allow none through swagger --- cognee/api/v1/add/routers/get_add_router.py | 3 ++- cognee/api/v1/memify/routers/get_memify_router.py | 5 +++-- 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/cognee/api/v1/add/routers/get_add_router.py b/cognee/api/v1/add/routers/get_add_router.py index f27d559e1..dfa7d275b 100644 --- a/cognee/api/v1/add/routers/get_add_router.py +++ 
b/cognee/api/v1/add/routers/get_add_router.py @@ -21,7 +21,8 @@ def get_add_router() -> APIRouter: async def add( data: List[UploadFile] = File(default=None), datasetName: Optional[str] = Form(default=None), - datasetId: Union[UUID, None] = Form(default=None, examples=[""]), + # Note: Literal is needed for Swagger use + datasetId: Union[UUID, Literal[""], None] = Form(default=None, examples=[""]), node_set: Optional[List[str]] = Form(default=[""], example=[""]), user: User = Depends(get_authenticated_user), ): diff --git a/cognee/api/v1/memify/routers/get_memify_router.py b/cognee/api/v1/memify/routers/get_memify_router.py index cf1df8f71..1976d7414 100644 --- a/cognee/api/v1/memify/routers/get_memify_router.py +++ b/cognee/api/v1/memify/routers/get_memify_router.py @@ -4,7 +4,7 @@ from fastapi import APIRouter from fastapi.responses import JSONResponse from fastapi import Depends from pydantic import Field -from typing import List, Optional +from typing import List, Optional, Union, Literal from cognee.api.DTO import InDTO from cognee.modules.users.models import User @@ -24,7 +24,8 @@ class MemifyPayloadDTO(InDTO): enrichment_tasks: Optional[List[str]] = Field(default=None, examples=[[]]) data: Optional[str] = Field(default="") dataset_name: Optional[str] = Field(default=None) - dataset_id: Optional[UUID] = Field(default=None, examples=[[""]]) + # Note: Literal is needed for Swagger use + dataset_id: Union[UUID, Literal[""], None] = Field(default=None, examples=[""]) node_name: Optional[List[str]] = Field(default=None, examples=[[]]) run_in_background: Optional[bool] = Field(default=False) From aaa17762938ad697003dfac59413d0477d082db8 Mon Sep 17 00:00:00 2001 From: Boris Date: Fri, 5 Sep 2025 15:39:04 +0200 Subject: [PATCH 18/19] feat: implement new local UI (#1279) ## Description ## DCO Affirmation I affirm that all code in every commit of this pull request conforms to the terms of the Topoteretes Developer Certificate of Origin. 
--------- Co-authored-by: Daulet Amirkhanov --- cognee-frontend/public/next.svg | 1 - cognee-frontend/public/vercel.svg | 1 - .../src/app/(graph)/GraphVisualization.tsx | 8 +- .../src/app/(graph)/getColorForNodeType.ts | 26 +- cognee-frontend/src/app/account/Account.tsx | 51 ++ cognee-frontend/src/app/account/page.tsx | 1 + .../src/app/dashboard/AddDataToCognee.tsx | 104 ++++ .../dashboard/CogneeInstancesAccordion.tsx | 31 + .../src/app/dashboard/Dashboard.tsx | 140 +++++ .../src/app/dashboard/DatasetsAccordion.tsx | 346 +++++++++++ .../dashboard/InstanceDatasetsAccordion.tsx | 102 ++++ .../src/app/dashboard/NotebooksAccordion.tsx | 150 +++++ cognee-frontend/src/app/dashboard/page.tsx | 1 + cognee-frontend/src/app/plan/Plan.tsx | 157 +++++ cognee-frontend/src/app/plan/page.tsx | 1 + cognee-frontend/src/modules/auth/index.ts | 2 + cognee-frontend/src/modules/auth/types.ts | 6 + .../src/modules/auth/useAuthenticatedUser.ts | 17 + .../src/modules/cloud/checkCloudConnection.ts | 10 + cognee-frontend/src/modules/cloud/index.ts | 2 + cognee-frontend/src/modules/cloud/syncData.ts | 11 + .../src/modules/ingestion/useData.ts | 2 + .../src/modules/ingestion/useDatasets.ts | 67 ++- .../src/modules/notebooks/useNotebooks.ts | 134 +++++ .../LoadingIndicator.module.css | 2 +- cognee-frontend/src/ui/Icons/AddIcon.tsx | 2 +- cognee-frontend/src/ui/Icons/BackIcon.tsx | 8 + cognee-frontend/src/ui/Icons/CaretIcon.tsx | 7 +- cognee-frontend/src/ui/Icons/CheckIcon.tsx | 7 + cognee-frontend/src/ui/Icons/CloseIcon.tsx | 8 + cognee-frontend/src/ui/Icons/CloudIcon.tsx | 7 + cognee-frontend/src/ui/Icons/CogneeIcon.tsx | 7 + cognee-frontend/src/ui/Icons/DatasetIcon.tsx | 9 + .../src/ui/Icons/LocalCogneeIcon.tsx | 10 + cognee-frontend/src/ui/Icons/MenuIcon.tsx | 9 + cognee-frontend/src/ui/Icons/MinusIcon.tsx | 7 + cognee-frontend/src/ui/Icons/NotebookIcon.tsx | 8 + cognee-frontend/src/ui/Icons/PlayIcon.tsx | 7 + cognee-frontend/src/ui/Icons/PlusIcon.tsx | 8 + 
cognee-frontend/src/ui/Icons/SearchIcon.tsx | 9 +- cognee-frontend/src/ui/Icons/SettingsIcon.tsx | 7 +- cognee-frontend/src/ui/Icons/index.ts | 26 +- cognee-frontend/src/ui/Layout/Header.tsx | 74 +++ cognee-frontend/src/ui/Layout/index.ts | 3 +- cognee-frontend/src/ui/elements/Accordion.tsx | 45 ++ .../src/ui/elements/AvatarImage.tsx | 0 cognee-frontend/src/ui/elements/CTAButton.tsx | 4 +- .../src/ui/elements/GhostButton.tsx | 4 +- .../src/ui/elements/IconButton.tsx | 14 + cognee-frontend/src/ui/elements/Input.tsx | 2 +- .../src/ui/elements/{ => Modal}/Modal.tsx | 2 +- .../src/ui/elements/Modal/index.ts | 3 + .../src/ui/elements/Modal/useModal.ts | 49 ++ .../src/ui/elements/NeutralButton.tsx | 6 +- .../src/ui/elements/Notebook/Notebook.tsx | 342 +++++++++++ .../elements/Notebook/NotebookCellHeader.tsx | 68 +++ .../src/ui/elements/Notebook/index.ts | 1 + .../src/ui/elements/Notebook/types.ts | 15 + cognee-frontend/src/ui/elements/PopupMenu.tsx | 48 ++ cognee-frontend/src/ui/elements/Select.tsx | 6 +- cognee-frontend/src/ui/elements/TextArea.tsx | 27 +- cognee-frontend/src/ui/elements/index.ts | 6 +- cognee-frontend/src/utils/fetch.ts | 4 + cognee-frontend/src/utils/index.ts | 1 + cognee-frontend/src/utils/useBoolean.ts | 2 + cognee-frontend/src/utils/useOutsideClick.ts | 25 + cognee/api/client.py | 21 +- cognee/api/health.py | 18 +- cognee/api/v1/cloud/routers/__init__.py | 1 + .../api/v1/cloud/routers/get_checks_router.py | 23 + .../datasets/routers/get_datasets_router.py | 16 +- cognee/api/v1/notebooks/routers/__init__.py | 1 + .../notebooks/routers/get_notebooks_router.py | 93 +++ .../v1/search/routers/get_search_router.py | 3 +- cognee/api/v1/sync/__init__.py | 17 + cognee/api/v1/sync/routers/__init__.py | 3 + cognee/api/v1/sync/routers/get_sync_router.py | 134 +++++ cognee/api/v1/sync/sync.py | 548 ++++++++++++++++++ .../api/v1/users/routers/get_auth_router.py | 14 +- .../databases/relational/__init__.py | 2 + .../databases/relational/get_async_session.py | 15 
+ .../sqlalchemy/SqlAlchemyAdapter.py | 1 + .../relational/with_async_session.py | 25 + .../files/storage/LocalFileStorage.py | 9 + .../files/storage/S3FileStorage.py | 5 + .../files/storage/StorageManager.py | 8 +- .../infrastructure/files/storage/storage.py | 16 + .../exceptions/CloudApiKeyMissingError.py | 15 + .../cloud/exceptions/CloudConnectionError.py | 15 + cognee/modules/cloud/exceptions/__init__.py | 2 + cognee/modules/cloud/operations/__init__.py | 1 + .../modules/cloud/operations/check_api_key.py | 25 + .../data/methods/check_dataset_name.py | 2 +- .../modules/data/methods/get_dataset_data.py | 2 +- cognee/modules/notebooks/methods/__init__.py | 5 + .../notebooks/methods/create_notebook.py | 24 + .../notebooks/methods/delete_notebook.py | 13 + .../modules/notebooks/methods/get_notebook.py | 21 + .../notebooks/methods/get_notebooks.py | 18 + .../notebooks/methods/update_notebook.py | 17 + cognee/modules/notebooks/models/Notebook.py | 53 ++ cognee/modules/notebooks/models/__init__.py | 1 + .../modules/notebooks/operations/__init__.py | 1 + .../operations/run_in_local_sandbox.py | 69 +++ .../graph_completion_cot_retriever.py | 2 +- .../retrieval/graph_completion_retriever.py | 6 +- .../modules/retrieval/temporal_retriever.py | 10 +- cognee/modules/search/methods/search.py | 41 +- cognee/modules/sync/__init__.py | 1 + cognee/modules/sync/methods/__init__.py | 18 + .../sync/methods/create_sync_operation.py | 45 ++ .../sync/methods/get_sync_operation.py | 79 +++ .../sync/methods/update_sync_operation.py | 117 ++++ cognee/modules/sync/models/SyncOperation.py | 86 +++ cognee/modules/sync/models/__init__.py | 3 + cognee/modules/users/__init__.py | 1 - cognee/modules/users/methods/create_user.py | 27 +- .../get_specific_user_permission_datasets.py | 3 +- 118 files changed, 3857 insertions(+), 109 deletions(-) delete mode 100644 cognee-frontend/public/next.svg delete mode 100644 cognee-frontend/public/vercel.svg create mode 100644 
cognee-frontend/src/app/account/Account.tsx create mode 100644 cognee-frontend/src/app/account/page.tsx create mode 100644 cognee-frontend/src/app/dashboard/AddDataToCognee.tsx create mode 100644 cognee-frontend/src/app/dashboard/CogneeInstancesAccordion.tsx create mode 100644 cognee-frontend/src/app/dashboard/Dashboard.tsx create mode 100644 cognee-frontend/src/app/dashboard/DatasetsAccordion.tsx create mode 100644 cognee-frontend/src/app/dashboard/InstanceDatasetsAccordion.tsx create mode 100644 cognee-frontend/src/app/dashboard/NotebooksAccordion.tsx create mode 100644 cognee-frontend/src/app/dashboard/page.tsx create mode 100644 cognee-frontend/src/app/plan/Plan.tsx create mode 100644 cognee-frontend/src/app/plan/page.tsx create mode 100644 cognee-frontend/src/modules/auth/index.ts create mode 100644 cognee-frontend/src/modules/auth/types.ts create mode 100644 cognee-frontend/src/modules/auth/useAuthenticatedUser.ts create mode 100644 cognee-frontend/src/modules/cloud/checkCloudConnection.ts create mode 100644 cognee-frontend/src/modules/cloud/index.ts create mode 100644 cognee-frontend/src/modules/cloud/syncData.ts create mode 100644 cognee-frontend/src/modules/notebooks/useNotebooks.ts create mode 100644 cognee-frontend/src/ui/Icons/BackIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/CheckIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/CloseIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/CloudIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/CogneeIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/DatasetIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/LocalCogneeIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/MenuIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/MinusIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/NotebookIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/PlayIcon.tsx create mode 100644 cognee-frontend/src/ui/Icons/PlusIcon.tsx create mode 100644 
cognee-frontend/src/ui/Layout/Header.tsx create mode 100644 cognee-frontend/src/ui/elements/Accordion.tsx create mode 100644 cognee-frontend/src/ui/elements/AvatarImage.tsx create mode 100644 cognee-frontend/src/ui/elements/IconButton.tsx rename cognee-frontend/src/ui/elements/{ => Modal}/Modal.tsx (84%) create mode 100644 cognee-frontend/src/ui/elements/Modal/index.ts create mode 100644 cognee-frontend/src/ui/elements/Modal/useModal.ts create mode 100644 cognee-frontend/src/ui/elements/Notebook/Notebook.tsx create mode 100644 cognee-frontend/src/ui/elements/Notebook/NotebookCellHeader.tsx create mode 100644 cognee-frontend/src/ui/elements/Notebook/index.ts create mode 100644 cognee-frontend/src/ui/elements/Notebook/types.ts create mode 100644 cognee-frontend/src/ui/elements/PopupMenu.tsx create mode 100644 cognee-frontend/src/utils/useOutsideClick.ts create mode 100644 cognee/api/v1/cloud/routers/__init__.py create mode 100644 cognee/api/v1/cloud/routers/get_checks_router.py create mode 100644 cognee/api/v1/notebooks/routers/__init__.py create mode 100644 cognee/api/v1/notebooks/routers/get_notebooks_router.py create mode 100644 cognee/api/v1/sync/__init__.py create mode 100644 cognee/api/v1/sync/routers/__init__.py create mode 100644 cognee/api/v1/sync/routers/get_sync_router.py create mode 100644 cognee/api/v1/sync/sync.py create mode 100644 cognee/infrastructure/databases/relational/get_async_session.py create mode 100644 cognee/infrastructure/databases/relational/with_async_session.py create mode 100644 cognee/modules/cloud/exceptions/CloudApiKeyMissingError.py create mode 100644 cognee/modules/cloud/exceptions/CloudConnectionError.py create mode 100644 cognee/modules/cloud/exceptions/__init__.py create mode 100644 cognee/modules/cloud/operations/__init__.py create mode 100644 cognee/modules/cloud/operations/check_api_key.py create mode 100644 cognee/modules/notebooks/methods/__init__.py create mode 100644 cognee/modules/notebooks/methods/create_notebook.py 
create mode 100644 cognee/modules/notebooks/methods/delete_notebook.py create mode 100644 cognee/modules/notebooks/methods/get_notebook.py create mode 100644 cognee/modules/notebooks/methods/get_notebooks.py create mode 100644 cognee/modules/notebooks/methods/update_notebook.py create mode 100644 cognee/modules/notebooks/models/Notebook.py create mode 100644 cognee/modules/notebooks/models/__init__.py create mode 100644 cognee/modules/notebooks/operations/__init__.py create mode 100644 cognee/modules/notebooks/operations/run_in_local_sandbox.py create mode 100644 cognee/modules/sync/__init__.py create mode 100644 cognee/modules/sync/methods/__init__.py create mode 100644 cognee/modules/sync/methods/create_sync_operation.py create mode 100644 cognee/modules/sync/methods/get_sync_operation.py create mode 100644 cognee/modules/sync/methods/update_sync_operation.py create mode 100644 cognee/modules/sync/models/SyncOperation.py create mode 100644 cognee/modules/sync/models/__init__.py diff --git a/cognee-frontend/public/next.svg b/cognee-frontend/public/next.svg deleted file mode 100644 index 5174b28c5..000000000 --- a/cognee-frontend/public/next.svg +++ /dev/null @@ -1 +0,0 @@ - \ No newline at end of file diff --git a/cognee-frontend/public/vercel.svg b/cognee-frontend/public/vercel.svg deleted file mode 100644 index d2f842227..000000000 --- a/cognee-frontend/public/vercel.svg +++ /dev/null @@ -1 +0,0 @@ - \ No newline at end of file diff --git a/cognee-frontend/src/app/(graph)/GraphVisualization.tsx b/cognee-frontend/src/app/(graph)/GraphVisualization.tsx index 67d6458f8..4e2d1e642 100644 --- a/cognee-frontend/src/app/(graph)/GraphVisualization.tsx +++ b/cognee-frontend/src/app/(graph)/GraphVisualization.tsx @@ -1,5 +1,6 @@ "use client"; +import classNames from "classnames"; import { MutableRefObject, useEffect, useImperativeHandle, useRef, useState, useCallback } from "react"; import { forceCollide, forceManyBody } from "d3-force-3d"; import ForceGraph, { 
ForceGraphMethods, GraphData, LinkObject, NodeObject } from "react-force-graph-2d"; @@ -10,6 +11,7 @@ interface GraphVisuzaliationProps { ref: MutableRefObject; data?: GraphData; graphControls: MutableRefObject; + className?: string; } export interface GraphVisualizationAPI { @@ -17,7 +19,7 @@ export interface GraphVisualizationAPI { setGraphShape: (shape: string) => void; } -export default function GraphVisualization({ ref, data, graphControls }: GraphVisuzaliationProps) { +export default function GraphVisualization({ ref, data, graphControls, className }: GraphVisuzaliationProps) { const textSize = 6; const nodeSize = 15; // const addNodeDistanceFromSourceNode = 15; @@ -201,7 +203,7 @@ export default function GraphVisualization({ ref, data, graphControls }: GraphVi if (typeof window !== "undefined" && data && graphRef.current) { // add collision force graphRef.current.d3Force("collision", forceCollide(nodeSize * 1.5)); - graphRef.current.d3Force("charge", forceManyBody().strength(-1500).distanceMin(300).distanceMax(900)); + graphRef.current.d3Force("charge", forceManyBody().strength(-10).distanceMin(10).distanceMax(50)); } }, [data, graphRef]); @@ -213,7 +215,7 @@ export default function GraphVisualization({ ref, data, graphControls }: GraphVi })); return ( -
+
{(data && typeof window !== "undefined") ? ( +
+
+
+
+
+
+
+ +
+ +
+ + + back + +
+
+
Account
+
Manage your account's settings.
+
{account.name}
+
+
+
Plan
+
You are using open-source version. Subscribe to get access to hosted cognee with your data!
+ + Select a plan + +
+
+
+
+
+
+
+
+
+ + ); +} diff --git a/cognee-frontend/src/app/account/page.tsx b/cognee-frontend/src/app/account/page.tsx new file mode 100644 index 000000000..f6323c313 --- /dev/null +++ b/cognee-frontend/src/app/account/page.tsx @@ -0,0 +1 @@ +export { default } from "./Account"; diff --git a/cognee-frontend/src/app/dashboard/AddDataToCognee.tsx b/cognee-frontend/src/app/dashboard/AddDataToCognee.tsx new file mode 100644 index 000000000..e5f4bb932 --- /dev/null +++ b/cognee-frontend/src/app/dashboard/AddDataToCognee.tsx @@ -0,0 +1,104 @@ +import { FormEvent, useCallback, useState } from "react"; +import { CloseIcon, PlusIcon } from "@/ui/Icons"; +import { useModal } from "@/ui/elements/Modal"; +import { CTAButton, GhostButton, IconButton, Modal, Select } from "@/ui/elements"; + +import addData from "@/modules/ingestion/addData"; +import { Dataset } from "@/modules/ingestion/useDatasets"; + +interface AddDataToCogneeProps { + datasets: Dataset[]; + refreshDatasets: () => void; +} + +export default function AddDataToCognee({ datasets, refreshDatasets }: AddDataToCogneeProps) { + const [filesForUpload, setFilesForUpload] = useState(null); + + const prepareFiles = useCallback((event: FormEvent) => { + const formElements = event.currentTarget; + const files = formElements.files; + + setFilesForUpload(files); + }, []); + + const processDataWithCognee = useCallback((state: object, event?: FormEvent) => { + event!.preventDefault(); + + if (!filesForUpload) { + return; + } + + const formElements = event!.currentTarget; + const datasetId = formElements.datasetName.value; + + return addData( + datasetId ? 
{ + id: datasetId, + } : { + name: "main_dataset", + }, + Array.from(filesForUpload) + ) + .then(() => { + refreshDatasets(); + setFilesForUpload(null); + }); + }, [filesForUpload, refreshDatasets]); + + const { + isModalOpen: isAddDataModalOpen, + openModal: openAddDataModal, + closeModal: closeAddDataModal, + isActionLoading: isProcessingDataWithCognee, + confirmAction: submitDataToCognee, + } = useModal(false, processDataWithCognee); + + return ( + <> + + + Add data to cognee + + + +
+
+ Add new data to a dataset? + +
+
Please select a dataset to add data in.
If you don't have any, don't worry, we will create one for you.
+
+
+ + + + + select files + + + {filesForUpload?.length && ( +
+
selected files:
+ {Array.from(filesForUpload || []).map((file) => ( +
+ {file.name} +
+ ))} +
+ )} +
+
+ closeAddDataModal()}>cancel + + {isProcessingDataWithCognee ? "processing..." : "add"} + +
+
+
+
+ + ); +} diff --git a/cognee-frontend/src/app/dashboard/CogneeInstancesAccordion.tsx b/cognee-frontend/src/app/dashboard/CogneeInstancesAccordion.tsx new file mode 100644 index 000000000..037c9e828 --- /dev/null +++ b/cognee-frontend/src/app/dashboard/CogneeInstancesAccordion.tsx @@ -0,0 +1,31 @@ +"use client"; + +import { useBoolean } from "@/utils"; +import { Accordion } from "@/ui/elements"; + +interface CogneeInstancesAccordionProps { + children: React.ReactNode; +} + +export default function CogneeInstancesAccordion({ + children, +}: CogneeInstancesAccordionProps) { + const { + value: isInstancesPanelOpen, + setTrue: openInstancesPanel, + setFalse: closeInstancesPanel, + } = useBoolean(true); + + return ( + <> + Cognee Instances} + isOpen={isInstancesPanelOpen} + openAccordion={openInstancesPanel} + closeAccordion={closeInstancesPanel} + > + {children} + + + ); +} diff --git a/cognee-frontend/src/app/dashboard/Dashboard.tsx b/cognee-frontend/src/app/dashboard/Dashboard.tsx new file mode 100644 index 000000000..c5980fb29 --- /dev/null +++ b/cognee-frontend/src/app/dashboard/Dashboard.tsx @@ -0,0 +1,140 @@ +"use client"; + +import { useCallback, useEffect, useRef, useState } from "react"; + +import { Header } from "@/ui/Layout"; +import { SearchIcon } from "@/ui/Icons"; +import { Notebook } from "@/ui/elements"; +import { Notebook as NotebookType } from "@/ui/elements/Notebook/types"; +import { Dataset } from "@/modules/ingestion/useDatasets"; +import useNotebooks from "@/modules/notebooks/useNotebooks"; + +import NotebooksAccordion from "./NotebooksAccordion"; +import CogneeInstancesAccordion from "./CogneeInstancesAccordion"; +import AddDataToCognee from "./AddDataToCognee"; +import InstanceDatasetsAccordion from "./InstanceDatasetsAccordion"; + +export default function Dashboard() { + const { + notebooks, + refreshNotebooks, + runCell, + addNotebook, + updateNotebook, + saveNotebook, + removeNotebook, + } = useNotebooks(); + + useEffect(() => { + if 
(!notebooks.length) { + refreshNotebooks() + .then((notebooks) => { + if (notebooks[0]) { + setSelectedNotebookId(notebooks[0].id); + } + }); + } + }, [notebooks.length, refreshNotebooks]); + + const [selectedNotebookId, setSelectedNotebookId] = useState(null); + + const handleNotebookRemove = useCallback((notebookId: string) => { + setSelectedNotebookId((currentSelectedNotebookId) => ( + currentSelectedNotebookId === notebookId ? null : currentSelectedNotebookId + )); + return removeNotebook(notebookId); + }, [removeNotebook]); + + const saveNotebookTimeoutRef = useRef(null); + const saveNotebookThrottled = useCallback((notebook: NotebookType) => { + const throttleTime = 1000; + + if (saveNotebookTimeoutRef.current) { + clearTimeout(saveNotebookTimeoutRef.current); + saveNotebookTimeoutRef.current = null; + } + + saveNotebookTimeoutRef.current = setTimeout(() => { + saveNotebook(notebook); + }, throttleTime) as unknown as number; + }, [saveNotebook]); + + useEffect(() => { + return () => { + if (saveNotebookTimeoutRef.current) { + clearTimeout(saveNotebookTimeoutRef.current); + saveNotebookTimeoutRef.current = null; + } + }; + }, []); + + const handleNotebookUpdate = useCallback((notebook: NotebookType) => { + updateNotebook(notebook); + saveNotebookThrottled(notebook); + }, [saveNotebookThrottled, updateNotebook]); + + const selectedNotebook = notebooks.find((notebook) => notebook.id === selectedNotebookId); + + // ############################ + // Datasets logic + + const [datasets, setDatasets] = useState([]); + const refreshDatasetsRef = useRef(() => {}); + + const handleDatasetsChange = useCallback((payload: { datasets: Dataset[], refreshDatasets: () => void }) => { + const { + datasets, + refreshDatasets, + } = payload; + + refreshDatasetsRef.current = refreshDatasets; + setDatasets(datasets); + }, []); + + return ( +
+
+ +
+
+
+ + +
+ + + + + +
+ + + +
+
+ +
+ {selectedNotebook && ( + + )} +
+
+
+ ); +} diff --git a/cognee-frontend/src/app/dashboard/DatasetsAccordion.tsx b/cognee-frontend/src/app/dashboard/DatasetsAccordion.tsx new file mode 100644 index 000000000..55ce23dfa --- /dev/null +++ b/cognee-frontend/src/app/dashboard/DatasetsAccordion.tsx @@ -0,0 +1,346 @@ +"use client"; + +import { ChangeEvent, useCallback, useEffect, useState } from "react"; +import { useBoolean } from "@/utils"; +import { Accordion, CTAButton, GhostButton, IconButton, Input, Modal, PopupMenu } from "@/ui/elements"; +import { AccordionProps } from "@/ui/elements/Accordion"; +import { CloseIcon, DatasetIcon, MinusIcon, PlusIcon } from "@/ui/Icons"; +import useDatasets, { Dataset } from "@/modules/ingestion/useDatasets"; +import addData from "@/modules/ingestion/addData"; +import cognifyDataset from "@/modules/datasets/cognifyDataset"; +import { DataFile } from '@/modules/ingestion/useData'; +import { LoadingIndicator } from '@/ui/App'; + +interface DatasetsChangePayload { + datasets: Dataset[] + refreshDatasets: () => void; +} + +export interface DatasetsAccordionProps extends Omit { + onDatasetsChange?: (payload: DatasetsChangePayload) => void; +} + +export default function DatasetsAccordion({ + title, + tools, + switchCaretPosition = false, + className, + contentClassName, + onDatasetsChange, +}: DatasetsAccordionProps) { + const { + value: isDatasetsPanelOpen, + setTrue: openDatasetsPanel, + setFalse: closeDatasetsPanel, + } = useBoolean(true); + + const { + datasets, + refreshDatasets, + addDataset, + removeDataset, + getDatasetData, + removeDatasetData, + } = useDatasets(); + + useEffect(() => { + if (datasets.length === 0) { + refreshDatasets(); + } + }, [datasets.length, refreshDatasets]); + + const [openDatasets, openDataset] = useState>(new Set()); + + const toggleDataset = (id: string) => { + openDataset((prev) => { + const newState = new Set(prev); + + if (newState.has(id)) { + newState.delete(id) + } else { + getDatasetData(id) + .then(() => { + newState.add(id); + 
}); + } + + return newState; + }); + }; + + const refreshOpenDatasetsData = useCallback(() => { + return Promise.all( + openDatasets.values().map( + (datasetId) => getDatasetData(datasetId) + ) + ); + }, [getDatasetData, openDatasets]); + + const refreshDatasetsAndData = useCallback(() => { + refreshDatasets() + .then(refreshOpenDatasetsData); + }, [refreshDatasets, refreshOpenDatasetsData]); + + useEffect(() => { + onDatasetsChange?.({ + datasets, + refreshDatasets: refreshDatasetsAndData, + }); + }, [datasets, onDatasetsChange, refreshDatasets, refreshDatasetsAndData]); + + const { + value: isNewDatasetModalOpen, + setTrue: openNewDatasetModal, + setFalse: closeNewDatasetModal, + } = useBoolean(false); + + const handleDatasetAdd = () => { + openNewDatasetModal(); + }; + + const [newDatasetError, setNewDatasetError] = useState(""); + + const handleNewDatasetSubmit = (event: React.FormEvent) => { + event.preventDefault(); + setNewDatasetError(""); + + const formElements = event.currentTarget; + + const datasetName = formElements.datasetName.value; + + if (datasetName.trim().length === 0) { + setNewDatasetError("Dataset name cannot be empty."); + return; + } + + if (datasetName.includes(" ") || datasetName.includes(".")) { + setNewDatasetError("Dataset name cannot contain spaces or periods."); + return; + } + + addDataset(datasetName) + .then(() => { + closeNewDatasetModal(); + refreshDatasetsAndData(); + }); + }; + + const { + value: isRemoveDatasetModalOpen, + setTrue: openRemoveDatasetModal, + setFalse: closeRemoveDatasetModal, + } = useBoolean(false); + + const [datasetToRemove, setDatasetToRemove] = useState(null); + + const handleDatasetRemove = (dataset: Dataset) => { + setDatasetToRemove(dataset); + openRemoveDatasetModal(); + }; + + const handleDatasetRemoveCancel = () => { + setDatasetToRemove(null); + closeRemoveDatasetModal(); + }; + + const handleRemoveDatasetConfirm = (event: React.FormEvent) => { + event.preventDefault(); + + if (datasetToRemove) { + 
removeDataset(datasetToRemove.id) + .then(() => { + closeRemoveDatasetModal(); + setDatasetToRemove(null); + refreshDatasetsAndData(); + }); + } + }; + + const { + value: isProcessingFiles, + setTrue: setProcessingFilesInProgress, + setFalse: setProcessingFilesDone, + } = useBoolean(false); + + const handleAddFiles = (dataset: Dataset, event: ChangeEvent) => { + event.stopPropagation(); + + if (isProcessingFiles) { + return; + } + + setProcessingFilesInProgress(); + + if (!event.target.files) { + return; + } + + const files: File[] = Array.from(event.target.files); + + if (!files.length) { + return; + } + + return addData(dataset, files) + .then(async () => { + await getDatasetData(dataset.id); + + const onUpdate = () => {}; + + return cognifyDataset(dataset, onUpdate) + .finally(() => { + setProcessingFilesDone(); + }); + }); + }; + + const [dataToRemove, setDataToRemove] = useState(null); + const { + value: isRemoveDataModalOpen, + setTrue: openRemoveDataModal, + setFalse: closeRemoveDataModal, + } = useBoolean(false); + + const handleDataRemove = (data: DataFile) => { + setDataToRemove(data); + + openRemoveDataModal(); + }; + const handleDataRemoveCancel = () => { + setDataToRemove(null); + closeRemoveDataModal(); + }; + const handleDataRemoveConfirm = (event: React.FormEvent) => { + event.preventDefault(); + + if (dataToRemove) { + removeDatasetData(dataToRemove.datasetId, dataToRemove.id) + .then(() => { + closeRemoveDataModal(); + setDataToRemove(null); + refreshDatasetsAndData(); + }); + } + } + + return ( + <> + Datasets} + isOpen={isDatasetsPanelOpen} + openAccordion={openDatasetsPanel} + closeAccordion={closeDatasetsPanel} + tools={tools || } + switchCaretPosition={switchCaretPosition} + className={className} + contentClassName={contentClassName} + > +
+ {datasets.length === 0 && ( +
+ No datasets here, add one by clicking + +
+ )} + {datasets.map((dataset) => { + return ( + + {isProcessingFiles ? : } + {dataset.name} +
+ )} + isOpen={openDatasets.has(dataset.id)} + openAccordion={() => toggleDataset(dataset.id)} + closeAccordion={() => toggleDataset(dataset.id)} + tools={( + + + +
+
+ + add data +
+
+
+
handleDatasetRemove(dataset)} className="hover:bg-gray-100 w-full text-left px-2 cursor-pointer">delete
+
+
+
+ )} + className="first:pt-1.5" + switchCaretPosition={true} + > + <> + {dataset.data?.length === 0 && ( +
+ No data in a dataset, add by clicking "add data" in a dropdown menu +
+ )} + {dataset.data?.map((data) => ( +
+ {data.name} +
+ handleDataRemove(data)}> +
+
+ ))} + +
+ ); + })} +
+ + + +
+
+ Create a new dataset? + +
+
Please provide a name for the dataset being created.
+
+
+ + {newDatasetError && {newDatasetError}} +
+
+ closeNewDatasetModal()}>cancel + create +
+
+
+
+ + +
+
+ Delete {datasetToRemove?.name} dataset? + +
+
Are you sure you want to delete {datasetToRemove?.name}? This action cannot be undone.
+
+ cancel + delete +
+
+
+ + +
+
+ Delete {dataToRemove?.name} data? + +
+
Are you sure you want to delete {dataToRemove?.name}? This action cannot be undone.
+
+ cancel + delete +
+
+
+ + ); +} diff --git a/cognee-frontend/src/app/dashboard/InstanceDatasetsAccordion.tsx b/cognee-frontend/src/app/dashboard/InstanceDatasetsAccordion.tsx new file mode 100644 index 000000000..fd0605349 --- /dev/null +++ b/cognee-frontend/src/app/dashboard/InstanceDatasetsAccordion.tsx @@ -0,0 +1,102 @@ +import { useCallback, useEffect } from "react"; + +import { fetch, useBoolean } from "@/utils"; +import { checkCloudConnection } from "@/modules/cloud"; +import { CloseIcon, CloudIcon, LocalCogneeIcon } from "@/ui/Icons"; +import { CTAButton, GhostButton, IconButton, Input, Modal } from "@/ui/elements"; + +import DatasetsAccordion, { DatasetsAccordionProps } from "./DatasetsAccordion"; + +type InstanceDatasetsAccordionProps = Omit; + +export default function InstanceDatasetsAccordion({ onDatasetsChange }: InstanceDatasetsAccordionProps) { + const { + value: isLocalCogneeConnected, + setTrue: setLocalCogneeConnected, + } = useBoolean(false); + + const { + value: isCloudCogneeConnected, + setTrue: setCloudCogneeConnected, + } = useBoolean(false); + + const checkConnectionToCloudCognee = useCallback((apiKey: string) => { + return checkCloudConnection(apiKey) + .then(setCloudCogneeConnected) + }, [setCloudCogneeConnected]); + + useEffect(() => { + const checkConnectionToLocalCognee = () => { + fetch.checkHealth() + .then(setLocalCogneeConnected) + }; + + checkConnectionToLocalCognee(); + + checkConnectionToCloudCognee(""); + }, [checkConnectionToCloudCognee, setCloudCogneeConnected, setLocalCogneeConnected]); + + const { + value: isCloudConnectedModalOpen, + setTrue: openCloudConnectionModal, + setFalse: closeCloudConnectionModal, + } = useBoolean(false); + + const handleCloudConnectionConfirm = (event: React.FormEvent) => { + event.preventDefault(); + + const apiKeyValue = event.currentTarget.apiKey.value; + + checkConnectionToCloudCognee(apiKeyValue) + .then(() => { + closeCloudConnectionModal(); + }); + }; + + return ( + <> + +
+ + local cognee +
+
+ )} + tools={isLocalCogneeConnected ? Connected : Not connected} + switchCaretPosition={true} + className="pt-3 pb-1.5" + contentClassName="pl-4" + onDatasetsChange={onDatasetsChange} + /> + + + + +
+
+ Connect to cloud? + +
+
Please provide your API key. You can find it on our platform.
+
+
+ +
+
+ closeCloudConnectionModal()}>cancel + connect +
+
+
+
+ + ); +} diff --git a/cognee-frontend/src/app/dashboard/NotebooksAccordion.tsx b/cognee-frontend/src/app/dashboard/NotebooksAccordion.tsx new file mode 100644 index 000000000..174efaa9e --- /dev/null +++ b/cognee-frontend/src/app/dashboard/NotebooksAccordion.tsx @@ -0,0 +1,150 @@ +"use client"; + +import { FormEvent, useCallback, useState } from "react"; +import { useBoolean } from "@/utils"; +import { Accordion, CTAButton, GhostButton, IconButton, Input, Modal } from "@/ui/elements"; +import { CloseIcon, MinusIcon, NotebookIcon, PlusIcon } from "@/ui/Icons"; +import { Notebook } from "@/ui/elements/Notebook/types"; +import { LoadingIndicator } from "@/ui/App"; +import { useModal } from "@/ui/elements/Modal"; + +interface NotebooksAccordionProps { + notebooks: Notebook[]; + addNotebook: (name: string) => Promise; + removeNotebook: (id: string) => Promise; + openNotebook: (id: string) => void; +} + +export default function NotebooksAccordion({ + notebooks, + addNotebook, + removeNotebook, + openNotebook, +}: NotebooksAccordionProps) { + const { + value: isNotebookPanelOpen, + setTrue: openNotebookPanel, + setFalse: closeNotebookPanel, + } = useBoolean(true); + + const { + value: isNotebookLoading, + setTrue: notebookLoading, + setFalse: notebookLoaded, + } = useBoolean(false); + + // Notebook removal modal + const [notebookToRemove, setNotebookToRemove] = useState(null); + + const handleNotebookRemove = (notebook: Notebook) => { + setNotebookToRemove(notebook); + openRemoveNotebookModal(); + }; + + const { + value: isRemoveNotebookModalOpen, + setTrue: openRemoveNotebookModal, + setFalse: closeRemoveNotebookModal, + } = useBoolean(false); + + const handleNotebookRemoveCancel = () => { + closeRemoveNotebookModal(); + setNotebookToRemove(null); + }; + + const handleNotebookRemoveConfirm = () => { + notebookLoading(); + removeNotebook(notebookToRemove!.id) + .finally(notebookLoaded) + .finally(closeRemoveNotebookModal); + setNotebookToRemove(null); + }; + + const 
handleNotebookAdd = useCallback((_: object, formEvent?: FormEvent) => { + if (!formEvent) { + return; + } + + formEvent.preventDefault(); + + const formElements = formEvent.currentTarget; + const notebookName = formElements.notebookName.value.trim(); + + return addNotebook(notebookName) + }, [addNotebook]); + + const { + isModalOpen: isNewNotebookModalOpen, + openModal: openNewNotebookModal, + closeModal: closeNewNotebookModal, + confirmAction: handleNewNotebookSubmit, + isActionLoading: isNewDatasetLoading, + } = useModal(false, handleNotebookAdd); + + return ( + <> + Notebooks} + isOpen={isNotebookPanelOpen} + openAccordion={openNotebookPanel} + closeAccordion={closeNotebookPanel} + tools={isNewDatasetLoading ? ( + + ) : ( + + )} + > + {notebooks.length === 0 && ( +
+ No notebooks here, add one by clicking + +
+ )} + {notebooks.map((notebook: Notebook) => ( +
+ +
+ {notebook.deletable && handleNotebookRemove(notebook)}>} +
+
+ ))} +
+ + +
+
+ Create a new notebook? + +
+
Please provide a name for the notebook being created.
+
+
+ + {/* {newDatasetError && {newDatasetError}} */} +
+
+ closeNewNotebookModal()}>cancel + create +
+
+
+
+ + +
+
+ Delete {notebookToRemove?.name} notebook? + +
+
Are you sure you want to delete {notebookToRemove?.name}? This action cannot be undone.
+
+ cancel + delete +
+
+
+ + ); +} diff --git a/cognee-frontend/src/app/dashboard/page.tsx b/cognee-frontend/src/app/dashboard/page.tsx new file mode 100644 index 000000000..2ab67cdd6 --- /dev/null +++ b/cognee-frontend/src/app/dashboard/page.tsx @@ -0,0 +1 @@ +export { default } from "./Dashboard"; diff --git a/cognee-frontend/src/app/plan/Plan.tsx b/cognee-frontend/src/app/plan/Plan.tsx new file mode 100644 index 000000000..fcca31566 --- /dev/null +++ b/cognee-frontend/src/app/plan/Plan.tsx @@ -0,0 +1,157 @@ +import Link from "next/link"; +import { BackIcon, CheckIcon } from "@/ui/Icons"; +import { CTAButton, NeutralButton } from "@/ui/elements"; +import Header from "@/ui/Layout/Header"; + +export default function Plan() { + return ( + <> +
+
+
+
+
+
+
+
+
+ +
+ +
+
+ + + back + +
+ +
+
+
+
Basic
+
Free
+
+ +
+
On-prem Subscription
+
$2470 /per month
+
Save 20% yearly
+
+ +
+
Cloud Subscription
+
$25 /per month
+
(beta pricing)
+
+ +
+
Everything in the free plan, plus...
+
+
License to use Cognee open source
+
Cognee tasks and pipelines
+
Custom schema and ontology generation
+
Integrated evaluations
+
More than 28 data sources supported
+
+
+ +
+
Everything in the free plan, plus...
+
+
License to use Cognee open source and Cognee Platform
+
1 day SLA
+
On-prem deployment
+
Hands-on support
+
Architecture review
+
Roadmap prioritization
+
Knowledge transfer
+
+
+ +
+
Everything in the free plan, plus...
+
+
Fully hosted cloud platform
+
Multi-tenant architecture
+
Comprehensive API endpoints
+
Automated scaling and parallel processing
+
Ability to group memories per user and domain
+
Automatic updates and priority support
+
1 GB ingestion + 10,000 API calls
+
+
+ +
+ Try for free +
+ +
+ Talk to us +
+ +
+ Sign up for Cogwit Beta +
+
+ +
+
Feature Comparison
+
Basic
+
On-prem
+
Cloud
+ +
Data Sources
+
28+
+
28+
+
28+
+ +
Deployment
+
Self-hosted
+
On-premise
+
Cloud
+ +
API Calls
+
Limited
+
Unlimited
+
10,000
+ +
Support
+
Community
+
Hands-on
+
Priority
+ +
SLA
+
—
+
1 day
+
Standard
+
+ +
+
+
Can I change my plan anytime?
+
Yes, you can upgrade or downgrade your plan at any time. Changes take effect immediately.
+
+
+
What happens to my data if I downgrade?
+
Your data is preserved, but features may be limited based on your new plan constraints.
+
+
+
Do you offer educational discounts?
+
Yes, we offer special pricing for educational institutions and students. Contact us for details.
+
+
+
Is there a free trial for paid plans?
+
All new accounts start with a 14-day free trial of our Pro plan features.
+
+
+
+ +
+ Need a custom solution? + Contact us +
+
+ + ); +} diff --git a/cognee-frontend/src/app/plan/page.tsx b/cognee-frontend/src/app/plan/page.tsx new file mode 100644 index 000000000..a1352fe8e --- /dev/null +++ b/cognee-frontend/src/app/plan/page.tsx @@ -0,0 +1 @@ +export { default } from "./Plan"; diff --git a/cognee-frontend/src/modules/auth/index.ts b/cognee-frontend/src/modules/auth/index.ts new file mode 100644 index 000000000..ea21cce2b --- /dev/null +++ b/cognee-frontend/src/modules/auth/index.ts @@ -0,0 +1,2 @@ +export { default as useAuthenticatedUser } from "./useAuthenticatedUser"; +export { type User } from "./types"; diff --git a/cognee-frontend/src/modules/auth/types.ts b/cognee-frontend/src/modules/auth/types.ts new file mode 100644 index 000000000..3441b4149 --- /dev/null +++ b/cognee-frontend/src/modules/auth/types.ts @@ -0,0 +1,6 @@ +export interface User { + id: string; + name: string; + email: string; + avatarImagePath: string; +} diff --git a/cognee-frontend/src/modules/auth/useAuthenticatedUser.ts b/cognee-frontend/src/modules/auth/useAuthenticatedUser.ts new file mode 100644 index 000000000..f789f3de4 --- /dev/null +++ b/cognee-frontend/src/modules/auth/useAuthenticatedUser.ts @@ -0,0 +1,17 @@ +import { useEffect, useState } from "react"; +import { fetch } from "@/utils"; +import { User } from "./types"; + +export default function useAuthenticatedUser() { + const [user, setUser] = useState(null); + + useEffect(() => { + if (!user) { + fetch("/v1/auth/me") + .then((response) => response.json()) + .then((data) => setUser(data)); + } + }, [user]); + + return { user }; +} diff --git a/cognee-frontend/src/modules/cloud/checkCloudConnection.ts b/cognee-frontend/src/modules/cloud/checkCloudConnection.ts new file mode 100644 index 000000000..dfc40767d --- /dev/null +++ b/cognee-frontend/src/modules/cloud/checkCloudConnection.ts @@ -0,0 +1,10 @@ +import { fetch } from "@/utils"; + +export default function checkCloudConnection(apiKey: string) { + return fetch("/v1/checks/connection", { + method: 
"POST", + headers: { + "X-Api-Key": apiKey, + }, + }); +} diff --git a/cognee-frontend/src/modules/cloud/index.ts b/cognee-frontend/src/modules/cloud/index.ts new file mode 100644 index 000000000..409f803c3 --- /dev/null +++ b/cognee-frontend/src/modules/cloud/index.ts @@ -0,0 +1,2 @@ +export { default as syncData } from "./syncData"; +export { default as checkCloudConnection } from "./checkCloudConnection"; diff --git a/cognee-frontend/src/modules/cloud/syncData.ts b/cognee-frontend/src/modules/cloud/syncData.ts new file mode 100644 index 000000000..dc4360a27 --- /dev/null +++ b/cognee-frontend/src/modules/cloud/syncData.ts @@ -0,0 +1,11 @@ +import { fetch } from "@/utils"; + +export default function syncData(datasetId?: string) { + return fetch("/v1/sync", { + method: "POST", + headers: { + "Content-Type": "application/json", + }, + ...(datasetId ? { body: JSON.stringify({ datasetId }) } : { body: "{}" }), + }); +} diff --git a/cognee-frontend/src/modules/ingestion/useData.ts b/cognee-frontend/src/modules/ingestion/useData.ts index 4368e296e..941521135 100644 --- a/cognee-frontend/src/modules/ingestion/useData.ts +++ b/cognee-frontend/src/modules/ingestion/useData.ts @@ -5,6 +5,7 @@ export interface DataFile { id: string; name: string; file: File; + datasetId: string; } const useData = () => { @@ -16,6 +17,7 @@ const useData = () => { id: v4(), name: file.name, file, + datasetId: "", })) ); }, []); diff --git a/cognee-frontend/src/modules/ingestion/useDatasets.ts b/cognee-frontend/src/modules/ingestion/useDatasets.ts index 9ae4ddcb2..7ef2b6b79 100644 --- a/cognee-frontend/src/modules/ingestion/useDatasets.ts +++ b/cognee-frontend/src/modules/ingestion/useDatasets.ts @@ -1,7 +1,9 @@ import { useCallback, useEffect, useRef, useState } from 'react'; import { v4 } from 'uuid'; -import { DataFile } from './useData'; + import { fetch } from '@/utils'; +import { DataFile } from './useData'; +import createDataset from "../datasets/createDataset"; export interface Dataset 
{ id: string; @@ -56,21 +58,24 @@ function useDatasets() { }, []); const addDataset = useCallback((datasetName: string) => { - setDatasets((datasets) => [ - ...datasets, - { - id: v4(), - name: datasetName, - data: [], - status: 'DATASET_INITIALIZED', - } - ]); + return createDataset({ name: datasetName }) + .then((dataset) => { + setDatasets((datasets) => [ + ...datasets, + dataset, + ]); + }); }, []); const removeDataset = useCallback((datasetId: string) => { - setDatasets((datasets) => - datasets.filter((dataset) => dataset.id !== datasetId) - ); + return fetch(`/v1/datasets/${datasetId}`, { + method: 'DELETE', + }) + .then(() => { + setDatasets((datasets) => + datasets.filter((dataset) => dataset.id !== datasetId) + ); + }); }, []); const fetchDatasets = useCallback(() => { @@ -94,7 +99,41 @@ function useDatasets() { }); }, [checkDatasetStatuses]); - return { datasets, addDataset, removeDataset, refreshDatasets: fetchDatasets }; + const getDatasetData = useCallback((datasetId: string) => { + return fetch(`/v1/datasets/${datasetId}/data`) + .then((response) => response.json()) + .then((data) => { + const datasetIndex = datasets.findIndex((dataset) => dataset.id === datasetId); + + if (datasetIndex >= 0) { + setDatasets((datasets) => [ + ...datasets.slice(0, datasetIndex), + { + ...datasets[datasetIndex], + data, + }, + ...datasets.slice(datasetIndex + 1), + ]); + } + + return data; + }); + }, [datasets]); + + const removeDatasetData = useCallback((datasetId: string, dataId: string) => { + return fetch(`/v1/datasets/${datasetId}/data/${dataId}`, { + method: 'DELETE', + }); + }, []); + + return { + datasets, + addDataset, + removeDataset, + getDatasetData, + removeDatasetData, + refreshDatasets: fetchDatasets, + }; }; export default useDatasets; diff --git a/cognee-frontend/src/modules/notebooks/useNotebooks.ts b/cognee-frontend/src/modules/notebooks/useNotebooks.ts new file mode 100644 index 000000000..f36f97448 --- /dev/null +++ 
b/cognee-frontend/src/modules/notebooks/useNotebooks.ts @@ -0,0 +1,134 @@ +import { useCallback, useState } from "react"; +import { fetch } from "@/utils"; +import { Cell, Notebook } from "@/ui/elements/Notebook/types"; + +function useNotebooks() { + const [notebooks, setNotebooks] = useState([]); + + const addNotebook = useCallback((notebookName: string) => { + return fetch("/v1/notebooks", { + body: JSON.stringify({ name: notebookName }), + method: "POST", + headers: { + "Content-Type": "application/json", + }, + }) + .then((response) => response.json()) + .then((notebook) => { + setNotebooks((notebooks) => [ + ...notebooks, + notebook, + ]); + + return notebook; + }); + }, []); + + const removeNotebook = useCallback((notebookId: string) => { + return fetch(`/v1/notebooks/${notebookId}`, { + method: "DELETE", + }) + .then(() => { + setNotebooks((notebooks) => + notebooks.filter((notebook) => notebook.id !== notebookId) + ); + }); + }, []); + + const fetchNotebooks = useCallback(() => { + return fetch("/v1/notebooks", { + headers: { + "Content-Type": "application/json", + }, + }) + .then((response) => response.json()) + .then((notebooks) => { + setNotebooks(notebooks); + + return notebooks; + }) + .catch((error) => { + console.error("Error fetching notebooks:", error); + }); + }, []); + + const updateNotebook = useCallback((updatedNotebook: Notebook) => { + setNotebooks((existingNotebooks) => + existingNotebooks.map((notebook) => + notebook.id === updatedNotebook.id + ? 
updatedNotebook + : notebook + ) + ); + }, []); + + const saveNotebook = useCallback((notebook: Notebook) => { + return fetch(`/v1/notebooks/${notebook.id}`, { + body: JSON.stringify({ + name: notebook.name, + cells: notebook.cells, + }), + method: "PUT", + headers: { + "Content-Type": "application/json", + }, + }) + .then((response) => response.json()) + }, []); + + const runCell = useCallback((notebook: Notebook, cell: Cell) => { + setNotebooks((existingNotebooks) => + existingNotebooks.map((existingNotebook) => + existingNotebook.id === notebook.id ? { + ...existingNotebook, + cells: existingNotebook.cells.map((existingCell) => + existingCell.id === cell.id ? { + ...existingCell, + result: undefined, + error: undefined, + } : existingCell + ), + } : notebook + ) + ); + + return fetch(`/v1/notebooks/${notebook.id}/${cell.id}/run`, { + body: JSON.stringify({ + content: cell.content, + }), + method: "POST", + headers: { + "Content-Type": "application/json", + }, + }) + .then((response) => response.json()) + .then((response) => { + setNotebooks((existingNotebooks) => + existingNotebooks.map((existingNotebook) => + existingNotebook.id === notebook.id ? { + ...existingNotebook, + cells: existingNotebook.cells.map((existingCell) => + existingCell.id === cell.id ? 
{ + ...existingCell, + result: response.result, + error: response.error, + } : existingCell + ), + } : notebook + ) + ); + }); + }, []); + + return { + notebooks, + addNotebook, + saveNotebook, + updateNotebook, + removeNotebook, + refreshNotebooks: fetchNotebooks, + runCell, + }; +}; + +export default useNotebooks; diff --git a/cognee-frontend/src/ui/App/Loading/DefaultLoadingIndicator/LoadingIndicator.module.css b/cognee-frontend/src/ui/App/Loading/DefaultLoadingIndicator/LoadingIndicator.module.css index 472081d57..d66b1e7f8 100644 --- a/cognee-frontend/src/ui/App/Loading/DefaultLoadingIndicator/LoadingIndicator.module.css +++ b/cognee-frontend/src/ui/App/Loading/DefaultLoadingIndicator/LoadingIndicator.module.css @@ -3,7 +3,7 @@ width: 1rem; height: 1rem; border-radius: 50%; - border: 0.18rem solid white; + border: 0.18rem solid var(--color-indigo-600);; border-top-color: transparent; border-bottom-color: transparent; animation: spin 2s linear infinite; diff --git a/cognee-frontend/src/ui/Icons/AddIcon.tsx b/cognee-frontend/src/ui/Icons/AddIcon.tsx index b9092feec..da150c8a3 100644 --- a/cognee-frontend/src/ui/Icons/AddIcon.tsx +++ b/cognee-frontend/src/ui/Icons/AddIcon.tsx @@ -1,4 +1,4 @@ -export default function SearchIcon({ width = 24, height = 24, color = 'currentColor', className = '' }) { +export default function AddIcon({ width = 24, height = 24, color = 'currentColor', className = '' }) { return ( diff --git a/cognee-frontend/src/ui/Icons/BackIcon.tsx b/cognee-frontend/src/ui/Icons/BackIcon.tsx new file mode 100644 index 000000000..796fb923b --- /dev/null +++ b/cognee-frontend/src/ui/Icons/BackIcon.tsx @@ -0,0 +1,8 @@ +export default function BackIcon({ width = 16, height = 16, color = "#17191C", className = "" }) { + return ( + + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/CaretIcon.tsx b/cognee-frontend/src/ui/Icons/CaretIcon.tsx index 29a5eca62..cef9b9a9a 100644 --- a/cognee-frontend/src/ui/Icons/CaretIcon.tsx +++ 
b/cognee-frontend/src/ui/Icons/CaretIcon.tsx @@ -1,8 +1,7 @@ -export default function CaretIcon({ width = 50, height = 36, color = "currentColor", className = "" }) { +export default function CaretIcon({ width = 17, height = 16, color = "#000000", className = "" }) { return ( - - - + + ); } diff --git a/cognee-frontend/src/ui/Icons/CheckIcon.tsx b/cognee-frontend/src/ui/Icons/CheckIcon.tsx new file mode 100644 index 000000000..68610b1eb --- /dev/null +++ b/cognee-frontend/src/ui/Icons/CheckIcon.tsx @@ -0,0 +1,7 @@ +export default function CheckIcon({ width = 17, height = 18, color = "#5C10F4", className = "" }) { + return ( + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/CloseIcon.tsx b/cognee-frontend/src/ui/Icons/CloseIcon.tsx new file mode 100644 index 000000000..7ea30123d --- /dev/null +++ b/cognee-frontend/src/ui/Icons/CloseIcon.tsx @@ -0,0 +1,8 @@ +export default function CloseIcon({ width = 29, height = 29, color = "#000000", className = "" }) { + return ( + + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/CloudIcon.tsx b/cognee-frontend/src/ui/Icons/CloudIcon.tsx new file mode 100644 index 000000000..9578c24d4 --- /dev/null +++ b/cognee-frontend/src/ui/Icons/CloudIcon.tsx @@ -0,0 +1,7 @@ +export default function CloudIcon({ width = 16, height = 12, color = "#5C10F4", className = "" }) { + return ( + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/CogneeIcon.tsx b/cognee-frontend/src/ui/Icons/CogneeIcon.tsx new file mode 100644 index 000000000..d9f95e0f2 --- /dev/null +++ b/cognee-frontend/src/ui/Icons/CogneeIcon.tsx @@ -0,0 +1,7 @@ +export default function CogneeIcon({ width = 21, height = 24, color="#6510F4", className="" }) { + return ( + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/DatasetIcon.tsx b/cognee-frontend/src/ui/Icons/DatasetIcon.tsx new file mode 100644 index 000000000..d17ff0470 --- /dev/null +++ b/cognee-frontend/src/ui/Icons/DatasetIcon.tsx @@ -0,0 +1,9 @@ +export default function DatasetIcon({ width = 16, 
height = 16, color = "#000000", className = '' }) { + return ( + + + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/LocalCogneeIcon.tsx b/cognee-frontend/src/ui/Icons/LocalCogneeIcon.tsx new file mode 100644 index 000000000..37f6016fc --- /dev/null +++ b/cognee-frontend/src/ui/Icons/LocalCogneeIcon.tsx @@ -0,0 +1,10 @@ +export default function LocalCogneeIcon({ width = 16, height = 16, color = "#000000", className = "" }) { + return ( + + + + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/MenuIcon.tsx b/cognee-frontend/src/ui/Icons/MenuIcon.tsx new file mode 100644 index 000000000..666b3293d --- /dev/null +++ b/cognee-frontend/src/ui/Icons/MenuIcon.tsx @@ -0,0 +1,9 @@ +export default function AddIcon({ width = 16, height = 16, color = "#000000", className = "" }) { + return ( + + + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/MinusIcon.tsx b/cognee-frontend/src/ui/Icons/MinusIcon.tsx new file mode 100644 index 000000000..7757d81a6 --- /dev/null +++ b/cognee-frontend/src/ui/Icons/MinusIcon.tsx @@ -0,0 +1,7 @@ +export default function MinusIcon({ width = 16, height = 16, color = "#000000", className = "" }) { + return ( + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/NotebookIcon.tsx b/cognee-frontend/src/ui/Icons/NotebookIcon.tsx new file mode 100644 index 000000000..a46228d80 --- /dev/null +++ b/cognee-frontend/src/ui/Icons/NotebookIcon.tsx @@ -0,0 +1,8 @@ +export default function NotebookIcon({ width = 16, height = 16, color = "#000000", className = "" }) { + return ( + + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/PlayIcon.tsx b/cognee-frontend/src/ui/Icons/PlayIcon.tsx new file mode 100644 index 000000000..865f103b0 --- /dev/null +++ b/cognee-frontend/src/ui/Icons/PlayIcon.tsx @@ -0,0 +1,7 @@ +export default function PlayIcon({ width = 11, height = 14, color = "#000000", className = "" }) { + return ( + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/PlusIcon.tsx b/cognee-frontend/src/ui/Icons/PlusIcon.tsx new file 
mode 100644 index 000000000..69a760e20 --- /dev/null +++ b/cognee-frontend/src/ui/Icons/PlusIcon.tsx @@ -0,0 +1,8 @@ +export default function PlusIcon({ width = 16, height = 16, color = "#000000", className = "" }) { + return ( + + + + + ); +} diff --git a/cognee-frontend/src/ui/Icons/SearchIcon.tsx b/cognee-frontend/src/ui/Icons/SearchIcon.tsx index 3a3baac33..56cddf4c2 100644 --- a/cognee-frontend/src/ui/Icons/SearchIcon.tsx +++ b/cognee-frontend/src/ui/Icons/SearchIcon.tsx @@ -1,9 +1,8 @@ -export default function SearchIcon({ width = 24, height = 24, color = 'currentColor', className = '' }) { +export default function SearchIcon({ width = 12, height = 12, color = "#D8D8D8", className = "" }) { return ( - - - - + + + ); } diff --git a/cognee-frontend/src/ui/Icons/SettingsIcon.tsx b/cognee-frontend/src/ui/Icons/SettingsIcon.tsx index ce006f49b..87e4c9872 100644 --- a/cognee-frontend/src/ui/Icons/SettingsIcon.tsx +++ b/cognee-frontend/src/ui/Icons/SettingsIcon.tsx @@ -1,7 +1,8 @@ -export default function SettingsIcon({ width = 32, height = 33, color = "#E8EAED" }) { +export default function SettingsIcon({ width = 16, height = 17, color = "#000000" }) { return ( - - + + + ); } diff --git a/cognee-frontend/src/ui/Icons/index.ts b/cognee-frontend/src/ui/Icons/index.ts index 0adaa8fd1..3d3f8124f 100644 --- a/cognee-frontend/src/ui/Icons/index.ts +++ b/cognee-frontend/src/ui/Icons/index.ts @@ -1,7 +1,19 @@ -export { default as AddIcon } from './AddIcon'; -export { default as CaretIcon } from './CaretIcon'; -export { default as SearchIcon } from './SearchIcon'; -export { default as DeleteIcon } from './DeleteIcon'; -export { default as GithubIcon } from './GitHubIcon'; -export { default as DiscordIcon } from './DiscordIcon'; -export { default as SettingsIcon } from './SettingsIcon'; +export { default as AddIcon } from "./AddIcon"; +export { default as BackIcon } from "./BackIcon"; +export { default as PlayIcon } from "./PlayIcon"; +export { default as MenuIcon } from 
"./MenuIcon"; +export { default as PlusIcon } from "./PlusIcon"; +export { default as MinusIcon } from "./MinusIcon"; +export { default as CloseIcon } from "./CloseIcon"; +export { default as CheckIcon } from "./CheckIcon"; +export { default as CaretIcon } from "./CaretIcon"; +export { default as CloudIcon } from "./CloudIcon"; +export { default as SearchIcon } from "./SearchIcon"; +export { default as DeleteIcon } from "./DeleteIcon"; +export { default as GithubIcon } from "./GitHubIcon"; +export { default as CogneeIcon } from "./CogneeIcon"; +export { default as DiscordIcon } from "./DiscordIcon"; +export { default as DatasetIcon } from "./DatasetIcon"; +export { default as SettingsIcon } from "./SettingsIcon"; +export { default as NotebookIcon } from "./NotebookIcon"; +export { default as LocalCogneeIcon } from "./LocalCogneeIcon"; diff --git a/cognee-frontend/src/ui/Layout/Header.tsx b/cognee-frontend/src/ui/Layout/Header.tsx new file mode 100644 index 000000000..465153e1a --- /dev/null +++ b/cognee-frontend/src/ui/Layout/Header.tsx @@ -0,0 +1,74 @@ +"use client"; + +import Link from "next/link"; +import Image from "next/image"; +import { useBoolean } from "@/utils"; + +import { CloseIcon, CloudIcon, CogneeIcon } from "../Icons"; +import { CTAButton, GhostButton, IconButton, Modal } from "../elements"; +import { useAuthenticatedUser } from "@/modules/auth"; +import syncData from "@/modules/cloud/syncData"; + +export default function Header() { + const { user } = useAuthenticatedUser(); + + const { + value: isSyncModalOpen, + setTrue: openSyncModal, + setFalse: closeSyncModal, + } = useBoolean(false); + + const handleDataSyncConfirm = () => { + syncData() + .finally(() => { + closeSyncModal(); + }); + }; + + return ( + <> +
+
+ +
Cognee Graph Interface
+
+ +
+ + +
Sync
+
+ + Premium + + {/*
+ +
*/} + + {user?.avatarImagePath ? ( + Name of the user + ) : ( +
+ {user?.email?.charAt(0) || "C"} +
+ )} + +
+
+ + +
+
+ Sync local datasets with cloud datasets? + +
+
Are you sure you want to sync local datasets to cloud?
+
+ cancel + confirm +
+
+
+ + ); +} diff --git a/cognee-frontend/src/ui/Layout/index.ts b/cognee-frontend/src/ui/Layout/index.ts index 54938ca4d..af5a67ac5 100644 --- a/cognee-frontend/src/ui/Layout/index.ts +++ b/cognee-frontend/src/ui/Layout/index.ts @@ -1 +1,2 @@ -export { default as Divider } from './Divider/Divider'; +export { default as Divider } from "./Divider/Divider"; +export { default as Header } from "./Header"; diff --git a/cognee-frontend/src/ui/elements/Accordion.tsx b/cognee-frontend/src/ui/elements/Accordion.tsx new file mode 100644 index 000000000..8779d6d36 --- /dev/null +++ b/cognee-frontend/src/ui/elements/Accordion.tsx @@ -0,0 +1,45 @@ +import classNames from "classnames"; +import { CaretIcon } from "../Icons"; + +export interface AccordionProps { + isOpen: boolean; + title: React.ReactNode; + openAccordion: () => void; + closeAccordion: () => void; + tools?: React.ReactNode; + children: React.ReactNode; + className?: string; + contentClassName?: string; + switchCaretPosition?: boolean; +} + +export default function Accordion({ title, tools, children, isOpen, openAccordion, closeAccordion, className, contentClassName, switchCaretPosition = false }: AccordionProps) { + return ( +
+
+ + {tools} +
+ + {isOpen && ( +
+ {children} +
+ )} +
+ ); +} diff --git a/cognee-frontend/src/ui/elements/AvatarImage.tsx b/cognee-frontend/src/ui/elements/AvatarImage.tsx new file mode 100644 index 000000000..e69de29bb diff --git a/cognee-frontend/src/ui/elements/CTAButton.tsx b/cognee-frontend/src/ui/elements/CTAButton.tsx index c38384cdd..02f1871fc 100644 --- a/cognee-frontend/src/ui/elements/CTAButton.tsx +++ b/cognee-frontend/src/ui/elements/CTAButton.tsx @@ -1,8 +1,8 @@ -import classNames from 'classnames'; +import classNames from "classnames"; import { ButtonHTMLAttributes } from "react"; export default function CTAButton({ children, className, ...props }: ButtonHTMLAttributes) { return ( - + ); } diff --git a/cognee-frontend/src/ui/elements/GhostButton.tsx b/cognee-frontend/src/ui/elements/GhostButton.tsx index 333dcc394..a27a0ff94 100644 --- a/cognee-frontend/src/ui/elements/GhostButton.tsx +++ b/cognee-frontend/src/ui/elements/GhostButton.tsx @@ -1,8 +1,8 @@ -import classNames from 'classnames'; +import classNames from "classnames"; import { ButtonHTMLAttributes } from "react"; export default function CTAButton({ children, className, ...props }: ButtonHTMLAttributes) { return ( - + ); } diff --git a/cognee-frontend/src/ui/elements/IconButton.tsx b/cognee-frontend/src/ui/elements/IconButton.tsx new file mode 100644 index 000000000..cbc35df5b --- /dev/null +++ b/cognee-frontend/src/ui/elements/IconButton.tsx @@ -0,0 +1,14 @@ +import classNames from "classnames"; +import { ButtonHTMLAttributes } from "react"; + +interface ButtonProps extends ButtonHTMLAttributes { + as?: React.ElementType; +} + +export default function IconButton({ as, children, className, ...props }: ButtonProps) { + const Element = as || "button"; + + return ( + {children} + ); +} diff --git a/cognee-frontend/src/ui/elements/Input.tsx b/cognee-frontend/src/ui/elements/Input.tsx index 904658eba..76451f9fa 100644 --- a/cognee-frontend/src/ui/elements/Input.tsx +++ b/cognee-frontend/src/ui/elements/Input.tsx @@ -3,6 +3,6 @@ import { 
InputHTMLAttributes } from "react" export default function Input({ className, ...props }: InputHTMLAttributes) { return ( - + ) } diff --git a/cognee-frontend/src/ui/elements/Modal.tsx b/cognee-frontend/src/ui/elements/Modal/Modal.tsx similarity index 84% rename from cognee-frontend/src/ui/elements/Modal.tsx rename to cognee-frontend/src/ui/elements/Modal/Modal.tsx index fd1db3c32..9d559a7ac 100644 --- a/cognee-frontend/src/ui/elements/Modal.tsx +++ b/cognee-frontend/src/ui/elements/Modal/Modal.tsx @@ -5,7 +5,7 @@ interface ModalProps { export default function Modal({ isOpen, children }: ModalProps) { return isOpen && ( -
+
{children}
); diff --git a/cognee-frontend/src/ui/elements/Modal/index.ts b/cognee-frontend/src/ui/elements/Modal/index.ts new file mode 100644 index 000000000..6386401d6 --- /dev/null +++ b/cognee-frontend/src/ui/elements/Modal/index.ts @@ -0,0 +1,3 @@ +export { default as Modal } from "./Modal"; +export { default as useModal } from "./useModal"; + diff --git a/cognee-frontend/src/ui/elements/Modal/useModal.ts b/cognee-frontend/src/ui/elements/Modal/useModal.ts new file mode 100644 index 000000000..4947d32ca --- /dev/null +++ b/cognee-frontend/src/ui/elements/Modal/useModal.ts @@ -0,0 +1,49 @@ +import { FormEvent, useCallback, useState } from "react"; +import { useBoolean } from "@/utils"; + +export default function useModal(initiallyOpen?: boolean, confirmCallback?: (state: object, event?: FormEvent) => Promise | ConfirmActionReturnType) { + const [modalState, setModalState] = useState({}); + const [isActionLoading, setLoading] = useState(false); + + const { + value: isModalOpen, + setTrue: openModalInternal, + setFalse: closeModalInternal, + } = useBoolean(initiallyOpen || false); + + const openModal = useCallback((state?: object) => { + if (state) { + setModalState(state); + } + openModalInternal(); + }, [openModalInternal]); + + const closeModal = useCallback(() => { + closeModalInternal(); + setModalState({}); + }, [closeModalInternal]); + + const confirmAction = useCallback((event?: FormEvent) => { + if (confirmCallback) { + setLoading(true); + + const maybePromise = confirmCallback(modalState, event); + + if (maybePromise instanceof Promise) { + return maybePromise + .finally(closeModal) + .finally(() => setLoading(false)); + } else { + return maybePromise; // Not a promise. 
+ } + } + }, [closeModal, confirmCallback, modalState]); + + return { + isModalOpen, + openModal, + closeModal, + confirmAction, + isActionLoading, + }; +} diff --git a/cognee-frontend/src/ui/elements/NeutralButton.tsx b/cognee-frontend/src/ui/elements/NeutralButton.tsx index 5b274ad65..7b991fcb8 100644 --- a/cognee-frontend/src/ui/elements/NeutralButton.tsx +++ b/cognee-frontend/src/ui/elements/NeutralButton.tsx @@ -1,8 +1,8 @@ -import classNames from 'classnames'; +import classNames from "classnames"; import { ButtonHTMLAttributes } from "react"; -export default function CTAButton({ children, className, ...props }: ButtonHTMLAttributes) { +export default function NeutralButton({ children, className, ...props }: ButtonHTMLAttributes) { return ( - + ); } diff --git a/cognee-frontend/src/ui/elements/Notebook/Notebook.tsx b/cognee-frontend/src/ui/elements/Notebook/Notebook.tsx new file mode 100644 index 000000000..0e037890a --- /dev/null +++ b/cognee-frontend/src/ui/elements/Notebook/Notebook.tsx @@ -0,0 +1,342 @@ +"use client"; + +import { v4 as uuid4 } from "uuid"; +import classNames from "classnames"; +import { Fragment, MutableRefObject, useCallback, useEffect, useRef, useState } from "react"; + +import { CaretIcon, PlusIcon } from "@/ui/Icons"; +import { IconButton, PopupMenu, TextArea } from "@/ui/elements"; +import { GraphControlsAPI } from "@/app/(graph)/GraphControls"; +import GraphVisualization, { GraphVisualizationAPI } from "@/app/(graph)/GraphVisualization"; + +import NotebookCellHeader from "./NotebookCellHeader"; +import { Cell, Notebook as NotebookType } from "./types"; + +interface NotebookProps { + notebook: NotebookType; + runCell: (notebook: NotebookType, cell: Cell) => Promise; + updateNotebook: (updatedNotebook: NotebookType) => void; + saveNotebook: (notebook: NotebookType) => void; +} + +export default function Notebook({ notebook, updateNotebook, saveNotebook, runCell }: NotebookProps) { + const saveCells = useCallback(() => { + 
saveNotebook(notebook); + }, [notebook, saveNotebook]); + + useEffect(() => { + window.addEventListener("beforeunload", saveCells); + + return () => { + window.removeEventListener("beforeunload", saveCells); + }; + }, [saveCells]); + + useEffect(() => { + if (notebook.cells.length === 0) { + const newCell: Cell = { + id: uuid4(), + name: "first cell", + type: "code", + content: "", + }; + updateNotebook({ + ...notebook, + cells: [newCell], + }); + } + }, [notebook, saveNotebook, updateNotebook]); + + const handleCellRun = useCallback((cell: Cell) => { + return runCell(notebook, cell); + }, [notebook, runCell]); + + const handleCellAdd = useCallback((afterCellIndex: number, cellType: "markdown" | "code") => { + const newCell: Cell = { + id: uuid4(), + name: "new cell", + type: cellType, + content: "", + }; + + const newNotebook = { + ...notebook, + cells: [ + ...notebook.cells.slice(0, afterCellIndex + 1), + newCell, + ...notebook.cells.slice(afterCellIndex + 1), + ], + }; + + toggleCellOpen(newCell.id); + updateNotebook(newNotebook); + }, [notebook, updateNotebook]); + + const handleCellRemove = useCallback((cell: Cell) => { + updateNotebook({ + ...notebook, + cells: notebook.cells.filter((c: Cell) => c.id !== cell.id), + }); + }, [notebook, updateNotebook]); + + const handleCellInputChange = useCallback((notebook: NotebookType, cell: Cell, value: string) => { + const newCell = {...cell, content: value }; + + updateNotebook({ + ...notebook, + cells: notebook.cells.map((cell: Cell) => (cell.id === newCell.id ? 
newCell : cell)), + }); + }, [updateNotebook]); + + const handleCellUp = useCallback((cell: Cell) => { + const index = notebook.cells.indexOf(cell); + + if (index > 0) { + const newCells = [...notebook.cells]; + newCells[index] = notebook.cells[index - 1]; + newCells[index - 1] = cell; + + updateNotebook({ + ...notebook, + cells: newCells, + }); + } + }, [notebook, updateNotebook]); + + const handleCellDown = useCallback((cell: Cell) => { + const index = notebook.cells.indexOf(cell); + + if (index < notebook.cells.length - 1) { + const newCells = [...notebook.cells]; + newCells[index] = notebook.cells[index + 1]; + newCells[index + 1] = cell; + + updateNotebook({ + ...notebook, + cells: newCells, + }); + } + }, [notebook, updateNotebook]); + + const handleCellRename = useCallback((cell: Cell) => { + const newName = prompt("Enter a new name for the cell:"); + + if (newName) { + updateNotebook({ + ...notebook, + cells: notebook.cells.map((c: Cell) => (c.id === cell.id ? {...c, name: newName } : c)), + }); + } + }, [notebook, updateNotebook]); + + const [openCells, setOpenCells] = useState(new Set(notebook.cells.map((c: Cell) => c.id))); + + const toggleCellOpen = (id: string) => { + setOpenCells((prev) => { + const newState = new Set(prev); + + if (newState.has(id)) { + newState.delete(id) + } else { + newState.add(id); + } + + return newState; + }); + }; + + return ( +
+
{notebook.name}
+ + {notebook.cells.map((cell: Cell, index) => ( + +
+
+ {cell.type === "code" ? ( + <> +
+ + + +
+ + + + {openCells.has(cell.id) && ( + <> +