chore: adds back accidentally deleted structured output test
This commit is contained in:
parent
fd23c75c09
commit
fa035f42f4
1 changed files with 204 additions and 0 deletions
204
cognee/tests/unit/modules/retrieval/structured_output_test.py
Normal file
204
cognee/tests/unit/modules/retrieval/structured_output_test.py
Normal file
|
|
@ -0,0 +1,204 @@
|
||||||
|
import asyncio
|
||||||
|
|
||||||
|
import pytest
|
||||||
|
import cognee
|
||||||
|
import pathlib
|
||||||
|
import os
|
||||||
|
|
||||||
|
from pydantic import BaseModel
|
||||||
|
from cognee.low_level import setup, DataPoint
|
||||||
|
from cognee.tasks.storage import add_data_points
|
||||||
|
from cognee.modules.chunking.models import DocumentChunk
|
||||||
|
from cognee.modules.data.processing.document_types import TextDocument
|
||||||
|
from cognee.modules.engine.models import Entity, EntityType
|
||||||
|
from cognee.modules.retrieval.entity_extractors.DummyEntityExtractor import DummyEntityExtractor
|
||||||
|
from cognee.modules.retrieval.context_providers.DummyContextProvider import DummyContextProvider
|
||||||
|
from cognee.modules.retrieval.graph_completion_cot_retriever import GraphCompletionCotRetriever
|
||||||
|
from cognee.modules.retrieval.graph_completion_retriever import GraphCompletionRetriever
|
||||||
|
from cognee.modules.retrieval.graph_completion_context_extension_retriever import (
|
||||||
|
GraphCompletionContextExtensionRetriever,
|
||||||
|
)
|
||||||
|
from cognee.modules.retrieval.EntityCompletionRetriever import EntityCompletionRetriever
|
||||||
|
from cognee.modules.retrieval.temporal_retriever import TemporalRetriever
|
||||||
|
from cognee.modules.retrieval.completion_retriever import CompletionRetriever
|
||||||
|
|
||||||
|
|
||||||
|
class TestAnswer(BaseModel):
|
||||||
|
answer: str
|
||||||
|
explanation: str
|
||||||
|
|
||||||
|
|
||||||
|
def _assert_string_answer(answer: list[str]):
|
||||||
|
assert isinstance(answer, list), f"Expected str, got {type(answer).__name__}"
|
||||||
|
assert all(isinstance(item, str) and item.strip() for item in answer), "Items should be strings"
|
||||||
|
assert all(item.strip() for item in answer), "Items should not be empty"
|
||||||
|
|
||||||
|
|
||||||
|
def _assert_structured_answer(answer: list[TestAnswer]):
|
||||||
|
assert isinstance(answer, list), f"Expected list, got {type(answer).__name__}"
|
||||||
|
assert all(isinstance(x, TestAnswer) for x in answer), "Items should be TestAnswer"
|
||||||
|
assert all(x.answer.strip() for x in answer), "Answer text should not be empty"
|
||||||
|
assert all(x.explanation.strip() for x in answer), "Explanation should not be empty"
|
||||||
|
|
||||||
|
|
||||||
|
async def _test_get_structured_graph_completion_cot():
|
||||||
|
retriever = GraphCompletionCotRetriever()
|
||||||
|
|
||||||
|
# Test with string response model (default)
|
||||||
|
string_answer = await retriever.get_completion("Who works at Figma?")
|
||||||
|
_assert_string_answer(string_answer)
|
||||||
|
|
||||||
|
# Test with structured response model
|
||||||
|
structured_answer = await retriever.get_completion(
|
||||||
|
"Who works at Figma?", response_model=TestAnswer
|
||||||
|
)
|
||||||
|
_assert_structured_answer(structured_answer)
|
||||||
|
|
||||||
|
|
||||||
|
async def _test_get_structured_graph_completion():
|
||||||
|
retriever = GraphCompletionRetriever()
|
||||||
|
|
||||||
|
# Test with string response model (default)
|
||||||
|
string_answer = await retriever.get_completion("Who works at Figma?")
|
||||||
|
_assert_string_answer(string_answer)
|
||||||
|
|
||||||
|
# Test with structured response model
|
||||||
|
structured_answer = await retriever.get_completion(
|
||||||
|
"Who works at Figma?", response_model=TestAnswer
|
||||||
|
)
|
||||||
|
_assert_structured_answer(structured_answer)
|
||||||
|
|
||||||
|
|
||||||
|
async def _test_get_structured_graph_completion_temporal():
|
||||||
|
retriever = TemporalRetriever()
|
||||||
|
|
||||||
|
# Test with string response model (default)
|
||||||
|
string_answer = await retriever.get_completion("When did Steve start working at Figma?")
|
||||||
|
_assert_string_answer(string_answer)
|
||||||
|
|
||||||
|
# Test with structured response model
|
||||||
|
structured_answer = await retriever.get_completion(
|
||||||
|
"When did Steve start working at Figma??", response_model=TestAnswer
|
||||||
|
)
|
||||||
|
_assert_structured_answer(structured_answer)
|
||||||
|
|
||||||
|
|
||||||
|
async def _test_get_structured_graph_completion_rag():
|
||||||
|
retriever = CompletionRetriever()
|
||||||
|
|
||||||
|
# Test with string response model (default)
|
||||||
|
string_answer = await retriever.get_completion("Where does Steve work?")
|
||||||
|
_assert_string_answer(string_answer)
|
||||||
|
|
||||||
|
# Test with structured response model
|
||||||
|
structured_answer = await retriever.get_completion(
|
||||||
|
"Where does Steve work?", response_model=TestAnswer
|
||||||
|
)
|
||||||
|
_assert_structured_answer(structured_answer)
|
||||||
|
|
||||||
|
|
||||||
|
async def _test_get_structured_graph_completion_context_extension():
|
||||||
|
retriever = GraphCompletionContextExtensionRetriever()
|
||||||
|
|
||||||
|
# Test with string response model (default)
|
||||||
|
string_answer = await retriever.get_completion("Who works at Figma?")
|
||||||
|
_assert_string_answer(string_answer)
|
||||||
|
|
||||||
|
# Test with structured response model
|
||||||
|
structured_answer = await retriever.get_completion(
|
||||||
|
"Who works at Figma?", response_model=TestAnswer
|
||||||
|
)
|
||||||
|
_assert_structured_answer(structured_answer)
|
||||||
|
|
||||||
|
|
||||||
|
async def _test_get_structured_entity_completion():
|
||||||
|
retriever = EntityCompletionRetriever(DummyEntityExtractor(), DummyContextProvider())
|
||||||
|
|
||||||
|
# Test with string response model (default)
|
||||||
|
string_answer = await retriever.get_completion("Who is Albert Einstein?")
|
||||||
|
_assert_string_answer(string_answer)
|
||||||
|
|
||||||
|
# Test with structured response model
|
||||||
|
structured_answer = await retriever.get_completion(
|
||||||
|
"Who is Albert Einstein?", response_model=TestAnswer
|
||||||
|
)
|
||||||
|
_assert_structured_answer(structured_answer)
|
||||||
|
|
||||||
|
|
||||||
|
class TestStructuredOutputCompletion:
|
||||||
|
@pytest.mark.asyncio
|
||||||
|
async def test_get_structured_completion(self):
|
||||||
|
system_directory_path = os.path.join(
|
||||||
|
pathlib.Path(__file__).parent, ".cognee_system/test_get_structured_completion"
|
||||||
|
)
|
||||||
|
cognee.config.system_root_directory(system_directory_path)
|
||||||
|
data_directory_path = os.path.join(
|
||||||
|
pathlib.Path(__file__).parent, ".data_storage/test_get_structured_completion"
|
||||||
|
)
|
||||||
|
cognee.config.data_root_directory(data_directory_path)
|
||||||
|
|
||||||
|
await cognee.prune.prune_data()
|
||||||
|
await cognee.prune.prune_system(metadata=True)
|
||||||
|
await setup()
|
||||||
|
|
||||||
|
class Company(DataPoint):
|
||||||
|
name: str
|
||||||
|
|
||||||
|
class Person(DataPoint):
|
||||||
|
name: str
|
||||||
|
works_for: Company
|
||||||
|
works_since: int
|
||||||
|
|
||||||
|
company1 = Company(name="Figma")
|
||||||
|
person1 = Person(name="Steve Rodger", works_for=company1, works_since=2015)
|
||||||
|
|
||||||
|
entities = [company1, person1]
|
||||||
|
await add_data_points(entities)
|
||||||
|
|
||||||
|
document = TextDocument(
|
||||||
|
name="Steve Rodger's career",
|
||||||
|
raw_data_location="somewhere",
|
||||||
|
external_metadata="",
|
||||||
|
mime_type="text/plain",
|
||||||
|
)
|
||||||
|
|
||||||
|
chunk1 = DocumentChunk(
|
||||||
|
text="Steve Rodger",
|
||||||
|
chunk_size=2,
|
||||||
|
chunk_index=0,
|
||||||
|
cut_type="sentence_end",
|
||||||
|
is_part_of=document,
|
||||||
|
contains=[],
|
||||||
|
)
|
||||||
|
chunk2 = DocumentChunk(
|
||||||
|
text="Mike Broski",
|
||||||
|
chunk_size=2,
|
||||||
|
chunk_index=1,
|
||||||
|
cut_type="sentence_end",
|
||||||
|
is_part_of=document,
|
||||||
|
contains=[],
|
||||||
|
)
|
||||||
|
chunk3 = DocumentChunk(
|
||||||
|
text="Christina Mayer",
|
||||||
|
chunk_size=2,
|
||||||
|
chunk_index=2,
|
||||||
|
cut_type="sentence_end",
|
||||||
|
is_part_of=document,
|
||||||
|
contains=[],
|
||||||
|
)
|
||||||
|
|
||||||
|
entities = [chunk1, chunk2, chunk3]
|
||||||
|
await add_data_points(entities)
|
||||||
|
|
||||||
|
entity_type = EntityType(name="Person", description="A human individual")
|
||||||
|
entity = Entity(name="Albert Einstein", is_a=entity_type, description="A famous physicist")
|
||||||
|
|
||||||
|
entities = [entity]
|
||||||
|
await add_data_points(entities)
|
||||||
|
|
||||||
|
await _test_get_structured_graph_completion_cot()
|
||||||
|
await _test_get_structured_graph_completion()
|
||||||
|
await _test_get_structured_graph_completion_temporal()
|
||||||
|
await _test_get_structured_graph_completion_rag()
|
||||||
|
await _test_get_structured_graph_completion_context_extension()
|
||||||
|
await _test_get_structured_entity_completion()
|
||||||
Loading…
Add table
Reference in a new issue