From 669aaae7856d4297631a2d9945afbdba70d27fb4 Mon Sep 17 00:00:00 2001
From: Daniel Chalef <131175+danielchalef@users.noreply.github.com>
Date: Wed, 29 Oct 2025 18:41:18 -0700
Subject: [PATCH] fix: Fix all linting errors in test suite

- Replace bare except with except Exception
- Remove unused imports and variables
- Fix type hints to use modern syntax
- Apply ruff formatting for line length
- Ensure all tests pass linting checks
---
 mcp_server/src/graphiti_mcp_server.py         |   4 +-
 mcp_server/tests/run_tests.py                 | 154 +++++--------
 mcp_server/tests/test_async_operations.py     | 165 +++++++------
 .../tests/test_comprehensive_integration.py   | 218 ++++++++----------
 mcp_server/tests/test_fixtures.py             | 112 ++++-----
 mcp_server/tests/test_stress_load.py          | 201 ++++++++--------
 mcp_server/uv.lock                            |   2 +-
 7 files changed, 403 insertions(+), 453 deletions(-)

diff --git a/mcp_server/src/graphiti_mcp_server.py b/mcp_server/src/graphiti_mcp_server.py
index e9f6a5b8..2d009af1 100644
--- a/mcp_server/src/graphiti_mcp_server.py
+++ b/mcp_server/src/graphiti_mcp_server.py
@@ -61,7 +61,9 @@ logging.basicConfig(
 # Configure specific loggers
 logging.getLogger('uvicorn').setLevel(logging.INFO)
 logging.getLogger('uvicorn.access').setLevel(logging.WARNING)  # Reduce access log noise
-logging.getLogger('mcp.server.streamable_http_manager').setLevel(logging.WARNING)  # Reduce MCP noise
+logging.getLogger('mcp.server.streamable_http_manager').setLevel(
+    logging.WARNING
+)  # Reduce MCP noise
 
 logger = logging.getLogger(__name__)
 
diff --git a/mcp_server/tests/run_tests.py b/mcp_server/tests/run_tests.py
index ab267ab3..e6c15576 100644
--- a/mcp_server/tests/run_tests.py
+++ b/mcp_server/tests/run_tests.py
@@ -5,14 +5,10 @@ Provides various test execution modes and reporting options.
 """
 
 import argparse
-import asyncio
-import json
 import os
-import subprocess
 import sys
 import time
 from pathlib import Path
-from typing import Dict, List, Optional
 
 import pytest
 from dotenv import load_dotenv
@@ -34,7 +30,7 @@ class TestRunner:
         self.test_dir = Path(__file__).parent
         self.results = {}
 
-    def check_prerequisites(self) -> Dict[str, bool]:
+    def check_prerequisites(self) -> dict[str, bool]:
         """Check if required services and dependencies are available."""
         checks = {}
 
@@ -46,7 +42,9 @@ class TestRunner:
                 # Check if .env file exists for helpful message
                 env_path = Path(__file__).parent.parent / '.env'
                 if not env_path.exists():
-                    checks['openai_api_key_hint'] = 'Set OPENAI_API_KEY in environment or create mcp_server/.env file'
+                    checks['openai_api_key_hint'] = (
+                        'Set OPENAI_API_KEY in environment or create mcp_server/.env file'
+                    )
         else:
             checks['openai_api_key'] = True
 
@@ -69,6 +67,7 @@ class TestRunner:
         """Check if Neo4j is available."""
         try:
             import neo4j
+
             # Try to connect
             uri = os.environ.get('NEO4J_URI', 'bolt://localhost:7687')
             user = os.environ.get('NEO4J_USER', 'neo4j')
@@ -76,21 +75,22 @@ class TestRunner:
 
             driver = neo4j.GraphDatabase.driver(uri, auth=(user, password))
             with driver.session() as session:
-                session.run("RETURN 1")
+                session.run('RETURN 1')
             driver.close()
             return True
-        except:
+        except Exception:
             return False
 
     def _check_falkordb(self) -> bool:
         """Check if FalkorDB is available."""
         try:
             import redis
+
             uri = os.environ.get('FALKORDB_URI', 'redis://localhost:6379')
             r = redis.from_url(uri)
             r.ping()
             return True
-        except:
+        except Exception:
             return False
 
     def _check_python_package(self, package: str) -> bool:
@@ -124,10 +124,12 @@ class TestRunner:
             pytest_args.extend(['-m', 'slow', 'test_stress_load.py'])
         elif suite == 'smoke':
             # Quick smoke test - just basic operations
-            pytest_args.extend([
-                'test_comprehensive_integration.py::TestCoreOperations::test_server_initialization',
-                'test_comprehensive_integration.py::TestCoreOperations::test_add_text_memory'
-            ])
+            pytest_args.extend(
+                [
+                    'test_comprehensive_integration.py::TestCoreOperations::test_server_initialization',
+                    'test_comprehensive_integration.py::TestCoreOperations::test_add_text_memory',
+                ]
+            )
         elif suite == 'all':
             pytest_args.append('.')
         else:
@@ -161,7 +163,7 @@ class TestRunner:
             env['DATABASE_PROVIDER'] = self.args.database
 
         # Run tests from the test directory
-        print(f"Running {suite} tests with pytest args: {' '.join(pytest_args)}")
+        print(f'Running {suite} tests with pytest args: {" ".join(pytest_args)}')
 
         # Change to test directory to run tests
         original_dir = os.getcwd()
@@ -176,52 +178,52 @@ class TestRunner:
 
     def run_performance_benchmark(self):
         """Run performance benchmarking suite."""
-        print("Running performance benchmarks...")
+        print('Running performance benchmarks...')
 
         # Import test modules
-        from test_comprehensive_integration import TestPerformance
-        from test_async_operations import TestAsyncPerformance
 
         # Run performance tests
-        result = pytest.main([
-            '-v',
-            'test_comprehensive_integration.py::TestPerformance',
-            'test_async_operations.py::TestAsyncPerformance',
-            '--benchmark-only' if self.args.benchmark_only else '',
-        ])
+        result = pytest.main(
+            [
+                '-v',
+                'test_comprehensive_integration.py::TestPerformance',
+                'test_async_operations.py::TestAsyncPerformance',
+                '--benchmark-only' if self.args.benchmark_only else '',
+            ]
+        )
 
         return result
 
     def generate_report(self):
         """Generate test execution report."""
         report = []
-        report.append("\n" + "=" * 60)
-        report.append("GRAPHITI MCP TEST EXECUTION REPORT")
-        report.append("=" * 60)
+        report.append('\n' + '=' * 60)
+        report.append('GRAPHITI MCP TEST EXECUTION REPORT')
+        report.append('=' * 60)
 
         # Prerequisites check
         checks = self.check_prerequisites()
-        report.append("\nPrerequisites:")
+        report.append('\nPrerequisites:')
         for check, passed in checks.items():
-            status = "✅" if passed else "❌"
-            report.append(f"  {status} {check}")
+            status = '✅' if passed else '❌'
+            report.append(f'  {status} {check}')
 
         # Test configuration
-        report.append(f"\nConfiguration:")
-        report.append(f"  Database: {self.args.database}")
-        report.append(f"  Mock LLM: {self.args.mock_llm}")
-        report.append(f"  Parallel: {self.args.parallel or 'No'}")
-        report.append(f"  Timeout: {self.args.timeout}s")
+        report.append('\nConfiguration:')
+        report.append(f'  Database: {self.args.database}')
+        report.append(f'  Mock LLM: {self.args.mock_llm}')
+        report.append(f'  Parallel: {self.args.parallel or "No"}')
+        report.append(f'  Timeout: {self.args.timeout}s')
 
         # Results summary (if available)
         if self.results:
-            report.append(f"\nResults:")
+            report.append('\nResults:')
             for suite, result in self.results.items():
-                status = "✅ Passed" if result == 0 else f"❌ Failed ({result})"
-                report.append(f"  {suite}: {status}")
+                status = '✅ Passed' if result == 0 else f'❌ Failed ({result})'
+                report.append(f'  {suite}: {status}')
 
-        report.append("=" * 60)
-        return "\n".join(report)
+        report.append('=' * 60)
+        return '\n'.join(report)
 
 
 def main():
@@ -244,70 +246,42 @@ Examples:
   python run_tests.py integration --parallel 4 # Run integration tests in parallel
   python run_tests.py stress --database neo4j  # Run stress tests with Neo4j
   python run_tests.py all --coverage          # Run all tests with coverage
-        """
+        """,
     )
 
     parser.add_argument(
         'suite',
         choices=['unit', 'integration', 'comprehensive', 'async', 'stress', 'smoke', 'all'],
-        help='Test suite to run'
+        help='Test suite to run',
     )
 
     parser.add_argument(
         '--database',
         choices=['neo4j', 'falkordb', 'kuzu'],
         default='kuzu',
-        help='Database backend to test (default: kuzu)'
+        help='Database backend to test (default: kuzu)',
     )
 
-    parser.add_argument(
-        '--mock-llm',
-        action='store_true',
-        help='Use mock LLM for faster testing'
-    )
+    parser.add_argument('--mock-llm', action='store_true', help='Use mock LLM for faster testing')
 
     parser.add_argument(
-        '--parallel',
-        type=int,
-        metavar='N',
-        help='Run tests in parallel with N workers'
+        '--parallel', type=int, metavar='N', help='Run tests in parallel with N workers'
     )
 
-    parser.add_argument(
-        '--coverage',
-        action='store_true',
-        help='Generate coverage report'
-    )
+    parser.add_argument('--coverage', action='store_true', help='Generate coverage report')
+
+    parser.add_argument('--verbose', action='store_true', help='Verbose output')
+
+    parser.add_argument('--skip-slow', action='store_true', help='Skip slow tests')
 
     parser.add_argument(
-        '--verbose',
-        action='store_true',
-        help='Verbose output'
+        '--timeout', type=int, default=300, help='Test timeout in seconds (default: 300)'
     )
 
-    parser.add_argument(
-        '--skip-slow',
-        action='store_true',
-        help='Skip slow tests'
-    )
+    parser.add_argument('--benchmark-only', action='store_true', help='Run only benchmark tests')
 
     parser.add_argument(
-        '--timeout',
-        type=int,
-        default=300,
-        help='Test timeout in seconds (default: 300)'
-    )
-
-    parser.add_argument(
-        '--benchmark-only',
-        action='store_true',
-        help='Run only benchmark tests'
-    )
-
-    parser.add_argument(
-        '--check-only',
-        action='store_true',
-        help='Only check prerequisites without running tests'
+        '--check-only', action='store_true', help='Only check prerequisites without running tests'
     )
 
     args = parser.parse_args()
@@ -326,26 +300,26 @@ Examples:
     validation_checks = {k: v for k, v in checks.items() if not k.endswith('_hint')}
 
     if not all(validation_checks.values()):
-        print("⚠️  Some prerequisites are not met:")
+        print('⚠️  Some prerequisites are not met:')
         for check, passed in checks.items():
             if check.endswith('_hint'):
                 continue  # Skip hint entries
             if not passed:
-                print(f"  ❌ {check}")
+                print(f'  ❌ {check}')
                 # Show hint if available
-                hint_key = f"{check}_hint"
+                hint_key = f'{check}_hint'
                 if hint_key in checks:
-                    print(f"     💡 {checks[hint_key]}")
+                    print(f'     💡 {checks[hint_key]}')
 
         if not args.mock_llm and not checks.get('openai_api_key'):
-            print("\n💡 Tip: Use --mock-llm to run tests without OpenAI API key")
+            print('\n💡 Tip: Use --mock-llm to run tests without OpenAI API key')
 
-        response = input("\nContinue anyway? (y/N): ")
+        response = input('\nContinue anyway? (y/N): ')
         if response.lower() != 'y':
             sys.exit(1)
 
     # Run tests
-    print(f"\n🚀 Starting test execution: {args.suite}")
+    print(f'\n🚀 Starting test execution: {args.suite}')
     start_time = time.time()
 
     if args.benchmark_only:
@@ -360,11 +334,11 @@ Examples:
 
     # Generate and print report
     print(runner.generate_report())
-    print(f"\n⏱️  Test execution completed in {duration:.2f} seconds")
+    print(f'\n⏱️  Test execution completed in {duration:.2f} seconds')
 
     # Exit with test result code
     sys.exit(result)
 
 
-if __name__ == "__main__":
-    main()
\ No newline at end of file
+if __name__ == '__main__':
+    main()
diff --git a/mcp_server/tests/test_async_operations.py b/mcp_server/tests/test_async_operations.py
index 56d41ae9..078a920c 100644
--- a/mcp_server/tests/test_async_operations.py
+++ b/mcp_server/tests/test_async_operations.py
@@ -7,15 +7,11 @@ Tests concurrent operations, queue management, and async patterns.
 import asyncio
 import json
 import time
-from typing import Any, Dict, List
-from unittest.mock import AsyncMock, patch
 
 import pytest
 from test_fixtures import (
     TestDataGenerator,
     graphiti_test_client,
-    performance_benchmark,
-    test_data_generator,
 )
 
 
@@ -38,7 +34,7 @@ class TestAsyncQueueManagement:
                         'source_description': 'sequential test',
                         'group_id': group_id,
                         'reference_id': f'seq_{i}',  # Add reference for tracking
-                    }
+                    },
                 )
                 episodes.append(result)
 
@@ -46,19 +42,18 @@ class TestAsyncQueueManagement:
             await asyncio.sleep(10)  # Allow time for sequential processing
 
             # Retrieve episodes and verify order
-            result = await session.call_tool(
-                'get_episodes',
-                {'group_id': group_id, 'last_n': 10}
-            )
+            result = await session.call_tool('get_episodes', {'group_id': group_id, 'last_n': 10})
 
             processed_episodes = json.loads(result.content[0].text)['episodes']
 
             # Verify all episodes were processed
-            assert len(processed_episodes) >= 5, f"Expected at least 5 episodes, got {len(processed_episodes)}"
+            assert len(processed_episodes) >= 5, (
+                f'Expected at least 5 episodes, got {len(processed_episodes)}'
+            )
 
             # Verify sequential processing (timestamps should be ordered)
             timestamps = [ep.get('created_at') for ep in processed_episodes]
-            assert timestamps == sorted(timestamps), "Episodes not processed in order"
+            assert timestamps == sorted(timestamps), 'Episodes not processed in order'
 
     @pytest.mark.asyncio
     async def test_concurrent_group_processing(self):
@@ -78,7 +73,7 @@ class TestAsyncQueueManagement:
                             'source': 'text',
                             'source_description': 'concurrent test',
                             'group_id': group_id,
-                        }
+                        },
                     )
                     tasks.append(task)
 
@@ -89,11 +84,11 @@ class TestAsyncQueueManagement:
 
             # Verify all succeeded
             failures = [r for r in results if isinstance(r, Exception)]
-            assert not failures, f"Concurrent operations failed: {failures}"
+            assert not failures, f'Concurrent operations failed: {failures}'
 
             # Check that execution was actually concurrent (should be faster than sequential)
             # Sequential would take at least 6 * processing_time
-            assert execution_time < 30, f"Concurrent execution too slow: {execution_time}s"
+            assert execution_time < 30, f'Concurrent execution too slow: {execution_time}s'
 
     @pytest.mark.asyncio
     async def test_queue_overflow_handling(self):
@@ -110,7 +105,7 @@ class TestAsyncQueueManagement:
                         'source': 'text',
                         'source_description': 'overflow test',
                         'group_id': group_id,
-                    }
+                    },
                 )
                 tasks.append(task)
 
@@ -121,11 +116,11 @@ class TestAsyncQueueManagement:
             successful = sum(1 for r in results if not isinstance(r, Exception))
 
             # Should handle overflow gracefully
-            assert successful > 0, "No episodes were queued successfully"
+            assert successful > 0, 'No episodes were queued successfully'
 
             # Log overflow behavior
             if successful < 100:
-                print(f"Queue overflow: {successful}/100 episodes queued")
+                print(f'Queue overflow: {successful}/100 episodes queued')
 
 
 class TestConcurrentOperations:
@@ -148,7 +143,7 @@ class TestConcurrentOperations:
                         'source': 'text',
                         'source_description': 'search test',
                         'group_id': group_id,
-                    }
+                    },
                 )
                 add_tasks.append(task)
 
@@ -172,7 +167,7 @@ class TestConcurrentOperations:
                         'query': query,
                         'group_id': group_id,
                         'limit': 10,
-                    }
+                    },
                 )
                 search_tasks.append(task)
 
@@ -182,10 +177,10 @@ class TestConcurrentOperations:
 
             # Verify all searches completed
             failures = [r for r in results if isinstance(r, Exception)]
-            assert not failures, f"Search operations failed: {failures}"
+            assert not failures, f'Search operations failed: {failures}'
 
             # Verify concurrent execution efficiency
-            assert search_time < len(search_queries) * 2, "Searches not executing concurrently"
+            assert search_time < len(search_queries) * 2, 'Searches not executing concurrently'
 
     @pytest.mark.asyncio
     async def test_mixed_operation_concurrency(self):
@@ -194,48 +189,51 @@ class TestConcurrentOperations:
             operations = []
 
             # Add memory operation
-            operations.append(session.call_tool(
-                'add_memory',
-                {
-                    'name': 'Mixed Op Test',
-                    'episode_body': 'Testing mixed operations',
-                    'source': 'text',
-                    'source_description': 'test',
-                    'group_id': group_id,
-                }
-            ))
+            operations.append(
+                session.call_tool(
+                    'add_memory',
+                    {
+                        'name': 'Mixed Op Test',
+                        'episode_body': 'Testing mixed operations',
+                        'source': 'text',
+                        'source_description': 'test',
+                        'group_id': group_id,
+                    },
+                )
+            )
 
             # Search operation
-            operations.append(session.call_tool(
-                'search_memory_nodes',
-                {
-                    'query': 'test',
-                    'group_id': group_id,
-                    'limit': 5,
-                }
-            ))
+            operations.append(
+                session.call_tool(
+                    'search_memory_nodes',
+                    {
+                        'query': 'test',
+                        'group_id': group_id,
+                        'limit': 5,
+                    },
+                )
+            )
 
             # Get episodes operation
-            operations.append(session.call_tool(
-                'get_episodes',
-                {
-                    'group_id': group_id,
-                    'last_n': 10,
-                }
-            ))
+            operations.append(
+                session.call_tool(
+                    'get_episodes',
+                    {
+                        'group_id': group_id,
+                        'last_n': 10,
+                    },
+                )
+            )
 
             # Get status operation
-            operations.append(session.call_tool(
-                'get_status',
-                {}
-            ))
+            operations.append(session.call_tool('get_status', {}))
 
             # Execute all concurrently
             results = await asyncio.gather(*operations, return_exceptions=True)
 
             # Check results
             for i, result in enumerate(results):
-                assert not isinstance(result, Exception), f"Operation {i} failed: {result}"
+                assert not isinstance(result, Exception), f'Operation {i} failed: {result}'
 
 
 class TestAsyncErrorHandling:
@@ -246,10 +244,10 @@ class TestAsyncErrorHandling:
         """Test recovery from operation timeouts."""
         async with graphiti_test_client() as (session, group_id):
             # Create a very large episode that might timeout
-            large_content = "x" * 1000000  # 1MB of data
+            large_content = 'x' * 1000000  # 1MB of data
 
             try:
-                result = await asyncio.wait_for(
+                await asyncio.wait_for(
                     session.call_tool(
                         'add_memory',
                         {
@@ -258,9 +256,9 @@ class TestAsyncErrorHandling:
                             'source': 'text',
                             'source_description': 'timeout test',
                             'group_id': group_id,
-                        }
+                        },
                     ),
-                    timeout=2.0  # Short timeout
+                    timeout=2.0,  # Short timeout
                 )
             except asyncio.TimeoutError:
                 # Expected timeout
@@ -268,7 +266,7 @@ class TestAsyncErrorHandling:
 
             # Verify server is still responsive after timeout
             status_result = await session.call_tool('get_status', {})
-            assert status_result is not None, "Server unresponsive after timeout"
+            assert status_result is not None, 'Server unresponsive after timeout'
 
     @pytest.mark.asyncio
     async def test_cancellation_handling(self):
@@ -284,7 +282,7 @@ class TestAsyncErrorHandling:
                         'source': 'text',
                         'source_description': 'cancel test',
                         'group_id': group_id,
-                    }
+                    },
                 )
             )
 
@@ -305,13 +303,13 @@ class TestAsyncErrorHandling:
         """Test that exceptions are properly propagated in async context."""
         async with graphiti_test_client() as (session, group_id):
             # Call with invalid arguments
-            with pytest.raises(Exception):
+            with pytest.raises(ValueError):
                 await session.call_tool(
                     'add_memory',
                     {
                         # Missing required fields
                         'group_id': group_id,
-                    }
+                    },
                 )
 
             # Server should remain operational
@@ -340,7 +338,7 @@ class TestAsyncPerformance:
                         'source': 'text',
                         'source_description': 'throughput test',
                         'group_id': group_id,
-                    }
+                    },
                 )
                 tasks.append(task)
 
@@ -355,14 +353,14 @@ class TestAsyncPerformance:
             performance_benchmark.record('async_throughput', throughput)
 
             # Log results
-            print(f"\nAsync Throughput Test:")
-            print(f"  Operations: {num_operations}")
-            print(f"  Successful: {successful}")
-            print(f"  Total time: {total_time:.2f}s")
-            print(f"  Throughput: {throughput:.2f} ops/s")
+            print('\nAsync Throughput Test:')
+            print(f'  Operations: {num_operations}')
+            print(f'  Successful: {successful}')
+            print(f'  Total time: {total_time:.2f}s')
+            print(f'  Throughput: {throughput:.2f} ops/s')
 
             # Assert minimum throughput
-            assert throughput > 1.0, f"Throughput too low: {throughput:.2f} ops/s"
+            assert throughput > 1.0, f'Throughput too low: {throughput:.2f} ops/s'
 
     @pytest.mark.asyncio
     async def test_latency_under_load(self, performance_benchmark):
@@ -380,7 +378,7 @@ class TestAsyncPerformance:
                             'source': 'text',
                             'source_description': 'background',
                             'group_id': f'background_{group_id}',
-                        }
+                        },
                     )
                 )
                 background_tasks.append(task)
@@ -389,10 +387,7 @@ class TestAsyncPerformance:
             latencies = []
             for _ in range(5):
                 start = time.time()
-                await session.call_tool(
-                    'get_status',
-                    {}
-                )
+                await session.call_tool('get_status', {})
                 latency = time.time() - start
                 latencies.append(latency)
                 performance_benchmark.record('latency_under_load', latency)
@@ -405,13 +400,13 @@ class TestAsyncPerformance:
             avg_latency = sum(latencies) / len(latencies)
             max_latency = max(latencies)
 
-            print(f"\nLatency Under Load:")
-            print(f"  Average: {avg_latency:.3f}s")
-            print(f"  Max: {max_latency:.3f}s")
+            print('\nLatency Under Load:')
+            print(f'  Average: {avg_latency:.3f}s')
+            print(f'  Max: {max_latency:.3f}s')
 
             # Assert acceptable latency
-            assert avg_latency < 2.0, f"Average latency too high: {avg_latency:.3f}s"
-            assert max_latency < 5.0, f"Max latency too high: {max_latency:.3f}s"
+            assert avg_latency < 2.0, f'Average latency too high: {avg_latency:.3f}s'
+            assert max_latency < 5.0, f'Max latency too high: {max_latency:.3f}s'
 
 
 class TestAsyncStreamHandling:
@@ -431,7 +426,7 @@ class TestAsyncStreamHandling:
                         'source': 'text',
                         'source_description': 'stream test',
                         'group_id': group_id,
-                    }
+                    },
                 )
 
             # Wait for processing
@@ -443,12 +438,12 @@ class TestAsyncStreamHandling:
                 {
                     'group_id': group_id,
                     'last_n': 100,  # Request all
-                }
+                },
             )
 
             # Verify response handling
             episodes = json.loads(result.content[0].text)['episodes']
-            assert len(episodes) >= 20, f"Expected at least 20 episodes, got {len(episodes)}"
+            assert len(episodes) >= 20, f'Expected at least 20 episodes, got {len(episodes)}'
 
     @pytest.mark.asyncio
     async def test_incremental_processing(self):
@@ -466,7 +461,7 @@ class TestAsyncStreamHandling:
                             'source': 'text',
                             'source_description': 'incremental test',
                             'group_id': group_id,
-                        }
+                        },
                     )
                     batch_tasks.append(task)
 
@@ -482,13 +477,15 @@ class TestAsyncStreamHandling:
                     {
                         'group_id': group_id,
                         'last_n': 100,
-                    }
+                    },
                 )
 
                 episodes = json.loads(result.content[0].text)['episodes']
                 expected_min = (batch + 1) * 5
-                assert len(episodes) >= expected_min, f"Batch {batch}: Expected at least {expected_min} episodes"
+                assert len(episodes) >= expected_min, (
+                    f'Batch {batch}: Expected at least {expected_min} episodes'
+                )
 
 
-if __name__ == "__main__":
-    pytest.main([__file__, "-v", "--asyncio-mode=auto"])
\ No newline at end of file
+if __name__ == '__main__':
+    pytest.main([__file__, '-v', '--asyncio-mode=auto'])
diff --git a/mcp_server/tests/test_comprehensive_integration.py b/mcp_server/tests/test_comprehensive_integration.py
index e1728bc2..b39ec485 100644
--- a/mcp_server/tests/test_comprehensive_integration.py
+++ b/mcp_server/tests/test_comprehensive_integration.py
@@ -9,9 +9,7 @@ import json
 import os
 import time
 from dataclasses import dataclass
-from datetime import datetime, timedelta
-from typing import Any, Dict, List, Optional
-from unittest.mock import patch
+from typing import Any
 
 import pytest
 from mcp import ClientSession, StdioServerParameters
@@ -26,7 +24,7 @@ class TestMetrics:
     start_time: float
     end_time: float
     success: bool
-    details: Dict[str, Any]
+    details: dict[str, Any]
 
     @property
     def duration(self) -> float:
@@ -37,10 +35,10 @@ class TestMetrics:
 class GraphitiTestClient:
     """Enhanced test client for comprehensive Graphiti MCP testing."""
 
-    def __init__(self, test_group_id: Optional[str] = None):
+    def __init__(self, test_group_id: str | None = None):
         self.test_group_id = test_group_id or f'test_{int(time.time())}'
         self.session = None
-        self.metrics: List[TestMetrics] = []
+        self.metrics: list[TestMetrics] = []
         self.default_timeout = 30  # seconds
 
     async def __aenter__(self):
@@ -76,7 +74,7 @@ class GraphitiTestClient:
             await self.client_context.__aexit__(exc_type, exc_val, exc_tb)
 
     async def call_tool_with_metrics(
-        self, tool_name: str, arguments: Dict[str, Any], timeout: Optional[float] = None
+        self, tool_name: str, arguments: dict[str, Any], timeout: float | None = None
     ) -> tuple[Any, TestMetrics]:
         """Call a tool and capture performance metrics."""
         start_time = time.time()
@@ -84,8 +82,7 @@ class GraphitiTestClient:
 
         try:
             result = await asyncio.wait_for(
-                self.session.call_tool(tool_name, arguments),
-                timeout=timeout
+                self.session.call_tool(tool_name, arguments), timeout=timeout
             )
 
             content = result.content[0].text if result.content else None
@@ -108,7 +105,7 @@ class GraphitiTestClient:
             start_time=start_time,
             end_time=end_time,
             success=success,
-            details=details
+            details=details,
         )
         self.metrics.append(metric)
 
@@ -132,8 +129,7 @@ class GraphitiTestClient:
 
         while (time.time() - start_time) < max_wait:
             result, _ = await self.call_tool_with_metrics(
-                'get_episodes',
-                {'group_id': self.test_group_id, 'last_n': 100}
+                'get_episodes', {'group_id': self.test_group_id, 'last_n': 100}
             )
 
             if result:
@@ -168,11 +164,11 @@ class TestCoreOperations:
                 'delete_entity_edge',
                 'get_entity_edge',
                 'clear_graph',
-                'get_status'
+                'get_status',
             }
 
             missing_tools = required_tools - tools
-            assert not missing_tools, f"Missing required tools: {missing_tools}"
+            assert not missing_tools, f'Missing required tools: {missing_tools}'
 
     @pytest.mark.asyncio
     async def test_add_text_memory(self):
@@ -187,15 +183,15 @@ class TestCoreOperations:
                     'source': 'text',
                     'source_description': 'conference notes',
                     'group_id': client.test_group_id,
-                }
+                },
             )
 
-            assert metric.success, f"Failed to add memory: {metric.details}"
+            assert metric.success, f'Failed to add memory: {metric.details}'
             assert 'queued' in str(result).lower()
 
             # Wait for processing
             processed = await client.wait_for_episode_processing(expected_count=1)
-            assert processed, "Episode was not processed within timeout"
+            assert processed, 'Episode was not processed within timeout'
 
     @pytest.mark.asyncio
     async def test_add_json_memory(self):
@@ -205,12 +201,9 @@ class TestCoreOperations:
                 'project': {
                     'name': 'GraphitiDB',
                     'version': '2.0.0',
-                    'features': ['temporal-awareness', 'hybrid-search', 'custom-entities']
+                    'features': ['temporal-awareness', 'hybrid-search', 'custom-entities'],
                 },
-                'team': {
-                    'size': 5,
-                    'roles': ['engineering', 'product', 'research']
-                }
+                'team': {'size': 5, 'roles': ['engineering', 'product', 'research']},
             }
 
             result, metric = await client.call_tool_with_metrics(
@@ -221,7 +214,7 @@ class TestCoreOperations:
                     'source': 'json',
                     'source_description': 'project database',
                     'group_id': client.test_group_id,
-                }
+                },
             )
 
             assert metric.success
@@ -246,11 +239,11 @@ class TestCoreOperations:
                     'source': 'message',
                     'source_description': 'support chat',
                     'group_id': client.test_group_id,
-                }
+                },
             )
 
             assert metric.success
-            assert metric.duration < 5, f"Add memory took too long: {metric.duration}s"
+            assert metric.duration < 5, f'Add memory took too long: {metric.duration}s'
 
 
 class TestSearchOperations:
@@ -269,7 +262,7 @@ class TestSearchOperations:
                     'source': 'text',
                     'source_description': 'product roadmap',
                     'group_id': client.test_group_id,
-                }
+                },
             )
 
             # Wait for processing
@@ -278,11 +271,7 @@ class TestSearchOperations:
             # Search for nodes
             result, metric = await client.call_tool_with_metrics(
                 'search_memory_nodes',
-                {
-                    'query': 'AI product features',
-                    'group_id': client.test_group_id,
-                    'limit': 10
-                }
+                {'query': 'AI product features', 'group_id': client.test_group_id, 'limit': 10},
             )
 
             assert metric.success
@@ -301,7 +290,7 @@ class TestSearchOperations:
                     'source': 'text',
                     'source_description': 'company profile',
                     'group_id': client.test_group_id,
-                }
+                },
             )
 
             await client.wait_for_episode_processing()
@@ -313,8 +302,8 @@ class TestSearchOperations:
                     'query': 'company information',
                     'group_id': client.test_group_id,
                     'created_after': '2020-01-01T00:00:00Z',
-                    'limit': 20
-                }
+                    'limit': 20,
+                },
             )
 
             assert metric.success
@@ -328,13 +317,13 @@ class TestSearchOperations:
                 {
                     'name': 'Technical Doc',
                     'episode_body': 'GraphQL API endpoints support pagination, filtering, and real-time subscriptions.',
-                    'source': 'text'
+                    'source': 'text',
                 },
                 {
                     'name': 'Architecture',
                     'episode_body': 'The system uses Neo4j for graph storage and OpenAI embeddings for semantic search.',
-                    'source': 'text'
-                }
+                    'source': 'text',
+                },
             ]
 
             for memory in test_memories:
@@ -347,11 +336,7 @@ class TestSearchOperations:
             # Test semantic + keyword search
             result, metric = await client.call_tool_with_metrics(
                 'search_memory_nodes',
-                {
-                    'query': 'Neo4j graph database',
-                    'group_id': client.test_group_id,
-                    'limit': 10
-                }
+                {'query': 'Neo4j graph database', 'group_id': client.test_group_id, 'limit': 10},
             )
 
             assert metric.success
@@ -374,18 +359,14 @@ class TestEpisodeManagement:
                         'source': 'text',
                         'source_description': 'test',
                         'group_id': client.test_group_id,
-                    }
+                    },
                 )
 
             await client.wait_for_episode_processing(expected_count=5)
 
             # Test pagination
             result, metric = await client.call_tool_with_metrics(
-                'get_episodes',
-                {
-                    'group_id': client.test_group_id,
-                    'last_n': 3
-                }
+                'get_episodes', {'group_id': client.test_group_id, 'last_n': 3}
             )
 
             assert metric.success
@@ -405,15 +386,14 @@ class TestEpisodeManagement:
                     'source': 'text',
                     'source_description': 'test',
                     'group_id': client.test_group_id,
-                }
+                },
             )
 
             await client.wait_for_episode_processing()
 
             # Get episode UUID
             result, _ = await client.call_tool_with_metrics(
-                'get_episodes',
-                {'group_id': client.test_group_id, 'last_n': 1}
+                'get_episodes', {'group_id': client.test_group_id, 'last_n': 1}
             )
 
             episodes = json.loads(result) if isinstance(result, str) else result
@@ -421,8 +401,7 @@ class TestEpisodeManagement:
 
             # Delete the episode
             result, metric = await client.call_tool_with_metrics(
-                'delete_episode',
-                {'episode_uuid': episode_uuid}
+                'delete_episode', {'episode_uuid': episode_uuid}
             )
 
             assert metric.success
@@ -445,7 +424,7 @@ class TestEntityAndEdgeOperations:
                     'source': 'text',
                     'source_description': 'org chart',
                     'group_id': client.test_group_id,
-                }
+                },
             )
 
             await client.wait_for_episode_processing()
@@ -453,11 +432,7 @@ class TestEntityAndEdgeOperations:
             # Search for nodes to get UUIDs
             result, _ = await client.call_tool_with_metrics(
                 'search_memory_nodes',
-                {
-                    'query': 'TechCorp',
-                    'group_id': client.test_group_id,
-                    'limit': 5
-                }
+                {'query': 'TechCorp', 'group_id': client.test_group_id, 'limit': 5},
             )
 
             # Note: This test assumes edges are created between entities
@@ -480,7 +455,7 @@ class TestErrorHandling:
             # Missing required arguments
             result, metric = await client.call_tool_with_metrics(
                 'add_memory',
-                {'name': 'Incomplete'}  # Missing required fields
+                {'name': 'Incomplete'},  # Missing required fields
             )
 
             assert not metric.success
@@ -491,7 +466,7 @@ class TestErrorHandling:
         """Test timeout handling for long operations."""
         async with GraphitiTestClient() as client:
             # Simulate a very large episode that might timeout
-            large_text = "Large document content. " * 10000
+            large_text = 'Large document content. ' * 10000
 
             result, metric = await client.call_tool_with_metrics(
                 'add_memory',
@@ -502,7 +477,7 @@ class TestErrorHandling:
                     'source_description': 'large file',
                     'group_id': client.test_group_id,
                 },
-                timeout=5  # Short timeout
+                timeout=5,  # Short timeout
             )
 
             # Check if timeout was handled gracefully
@@ -524,7 +499,7 @@ class TestErrorHandling:
                         'source': 'text',
                         'source_description': 'concurrent test',
                         'group_id': client.test_group_id,
-                    }
+                    },
                 )
                 tasks.append(task)
 
@@ -543,35 +518,34 @@ class TestPerformance:
         """Measure and validate operation latencies."""
         async with GraphitiTestClient() as client:
             operations = [
-                ('add_memory', {
-                    'name': 'Perf Test',
-                    'episode_body': 'Simple text',
-                    'source': 'text',
-                    'source_description': 'test',
-                    'group_id': client.test_group_id,
-                }),
-                ('search_memory_nodes', {
-                    'query': 'test',
-                    'group_id': client.test_group_id,
-                    'limit': 10
-                }),
-                ('get_episodes', {
-                    'group_id': client.test_group_id,
-                    'last_n': 10
-                })
+                (
+                    'add_memory',
+                    {
+                        'name': 'Perf Test',
+                        'episode_body': 'Simple text',
+                        'source': 'text',
+                        'source_description': 'test',
+                        'group_id': client.test_group_id,
+                    },
+                ),
+                (
+                    'search_memory_nodes',
+                    {'query': 'test', 'group_id': client.test_group_id, 'limit': 10},
+                ),
+                ('get_episodes', {'group_id': client.test_group_id, 'last_n': 10}),
             ]
 
             for tool_name, args in operations:
                 _, metric = await client.call_tool_with_metrics(tool_name, args)
 
                 # Log performance metrics
-                print(f"{tool_name}: {metric.duration:.2f}s")
+                print(f'{tool_name}: {metric.duration:.2f}s')
 
                 # Basic latency assertions
                 if tool_name == 'get_episodes':
-                    assert metric.duration < 2, f"{tool_name} too slow"
+                    assert metric.duration < 2, f'{tool_name} too slow'
                 elif tool_name == 'search_memory_nodes':
-                    assert metric.duration < 10, f"{tool_name} too slow"
+                    assert metric.duration < 10, f'{tool_name} too slow'
 
     @pytest.mark.asyncio
     async def test_batch_processing_efficiency(self):
@@ -590,33 +564,35 @@ class TestPerformance:
                         'source': 'text',
                         'source_description': 'batch test',
                         'group_id': client.test_group_id,
-                    }
+                    },
                 )
 
             # Wait for all to process
             processed = await client.wait_for_episode_processing(
                 expected_count=batch_size,
-                max_wait=120  # Allow more time for batch
+                max_wait=120,  # Allow more time for batch
             )
 
             total_time = time.time() - start_time
             avg_time_per_item = total_time / batch_size
 
-            assert processed, f"Failed to process {batch_size} items"
-            assert avg_time_per_item < 15, f"Batch processing too slow: {avg_time_per_item:.2f}s per item"
+            assert processed, f'Failed to process {batch_size} items'
+            assert avg_time_per_item < 15, (
+                f'Batch processing too slow: {avg_time_per_item:.2f}s per item'
+            )
 
             # Generate performance report
-            print(f"\nBatch Performance Report:")
-            print(f"  Total items: {batch_size}")
-            print(f"  Total time: {total_time:.2f}s")
-            print(f"  Avg per item: {avg_time_per_item:.2f}s")
+            print('\nBatch Performance Report:')
+            print(f'  Total items: {batch_size}')
+            print(f'  Total time: {total_time:.2f}s')
+            print(f'  Avg per item: {avg_time_per_item:.2f}s')
 
 
 class TestDatabaseBackends:
     """Test different database backend configurations."""
 
     @pytest.mark.asyncio
-    @pytest.mark.parametrize("database", ["neo4j", "falkordb", "kuzu"])
+    @pytest.mark.parametrize('database', ['neo4j', 'falkordb', 'kuzu'])
     async def test_database_operations(self, database):
         """Test operations with different database backends."""
         env_vars = {
@@ -625,53 +601,50 @@ class TestDatabaseBackends:
         }
 
         if database == 'neo4j':
-            env_vars.update({
-                'NEO4J_URI': os.environ.get('NEO4J_URI', 'bolt://localhost:7687'),
-                'NEO4J_USER': os.environ.get('NEO4J_USER', 'neo4j'),
-                'NEO4J_PASSWORD': os.environ.get('NEO4J_PASSWORD', 'graphiti'),
-            })
+            env_vars.update(
+                {
+                    'NEO4J_URI': os.environ.get('NEO4J_URI', 'bolt://localhost:7687'),
+                    'NEO4J_USER': os.environ.get('NEO4J_USER', 'neo4j'),
+                    'NEO4J_PASSWORD': os.environ.get('NEO4J_PASSWORD', 'graphiti'),
+                }
+            )
         elif database == 'falkordb':
             env_vars['FALKORDB_URI'] = os.environ.get('FALKORDB_URI', 'redis://localhost:6379')
         elif database == 'kuzu':
-            env_vars['KUZU_PATH'] = os.environ.get('KUZU_PATH', f'./test_kuzu_{int(time.time())}.db')
+            env_vars['KUZU_PATH'] = os.environ.get(
+                'KUZU_PATH', f'./test_kuzu_{int(time.time())}.db'
+            )
 
-        server_params = StdioServerParameters(
-            command='uv',
-            args=['run', 'main.py', '--transport', 'stdio', '--database', database],
-            env=env_vars
-        )
-
-        # Test basic operations with each backend
+        # This test would require setting up server with specific database
         # Implementation depends on database availability
+        pass  # Placeholder for database-specific tests
 
 
 def generate_test_report(client: GraphitiTestClient) -> str:
     """Generate a comprehensive test report from metrics."""
     if not client.metrics:
-        return "No metrics collected"
+        return 'No metrics collected'
 
     report = []
-    report.append("\n" + "="*60)
-    report.append("GRAPHITI MCP TEST REPORT")
-    report.append("="*60)
+    report.append('\n' + '=' * 60)
+    report.append('GRAPHITI MCP TEST REPORT')
+    report.append('=' * 60)
 
     # Summary statistics
     total_ops = len(client.metrics)
     successful_ops = sum(1 for m in client.metrics if m.success)
     avg_duration = sum(m.duration for m in client.metrics) / total_ops
 
-    report.append(f"\nTotal Operations: {total_ops}")
-    report.append(f"Successful: {successful_ops} ({successful_ops/total_ops*100:.1f}%)")
-    report.append(f"Average Duration: {avg_duration:.2f}s")
+    report.append(f'\nTotal Operations: {total_ops}')
+    report.append(f'Successful: {successful_ops} ({successful_ops / total_ops * 100:.1f}%)')
+    report.append(f'Average Duration: {avg_duration:.2f}s')
 
     # Operation breakdown
-    report.append("\nOperation Breakdown:")
+    report.append('\nOperation Breakdown:')
     operation_stats = {}
     for metric in client.metrics:
         if metric.operation not in operation_stats:
-            operation_stats[metric.operation] = {
-                'count': 0, 'success': 0, 'total_duration': 0
-            }
+            operation_stats[metric.operation] = {'count': 0, 'success': 0, 'total_duration': 0}
         stats = operation_stats[metric.operation]
         stats['count'] += 1
         stats['success'] += 1 if metric.success else 0
@@ -681,20 +654,19 @@ def generate_test_report(client: GraphitiTestClient) -> str:
         avg_dur = stats['total_duration'] / stats['count']
         success_rate = stats['success'] / stats['count'] * 100
         report.append(
-            f"  {op}: {stats['count']} calls, "
-            f"{success_rate:.0f}% success, {avg_dur:.2f}s avg"
+            f'  {op}: {stats["count"]} calls, {success_rate:.0f}% success, {avg_dur:.2f}s avg'
         )
 
     # Slowest operations
     slowest = sorted(client.metrics, key=lambda m: m.duration, reverse=True)[:5]
-    report.append("\nSlowest Operations:")
+    report.append('\nSlowest Operations:')
     for metric in slowest:
-        report.append(f"  {metric.operation}: {metric.duration:.2f}s")
+        report.append(f'  {metric.operation}: {metric.duration:.2f}s')
 
-    report.append("="*60)
-    return "\n".join(report)
+    report.append('=' * 60)
+    return '\n'.join(report)
 
 
-if __name__ == "__main__":
+if __name__ == '__main__':
     # Run tests with pytest
-    pytest.main([__file__, "-v", "--asyncio-mode=auto"])
\ No newline at end of file
+    pytest.main([__file__, '-v', '--asyncio-mode=auto'])
diff --git a/mcp_server/tests/test_fixtures.py b/mcp_server/tests/test_fixtures.py
index ed1e0eda..aa639630 100644
--- a/mcp_server/tests/test_fixtures.py
+++ b/mcp_server/tests/test_fixtures.py
@@ -8,7 +8,7 @@ import os
 import random
 import time
 from contextlib import asynccontextmanager
-from typing import Any, Dict, List, Optional
+from typing import Any
 
 import pytest
 from faker import Faker
@@ -22,7 +22,7 @@ class TestDataGenerator:
     """Generate realistic test data for various scenarios."""
 
     @staticmethod
-    def generate_company_profile() -> Dict[str, Any]:
+    def generate_company_profile() -> dict[str, Any]:
         """Generate a realistic company profile."""
         return {
             'company': {
@@ -30,7 +30,7 @@ class TestDataGenerator:
                 'founded': random.randint(1990, 2023),
                 'industry': random.choice(['Tech', 'Finance', 'Healthcare', 'Retail']),
                 'employees': random.randint(10, 10000),
-                'revenue': f"${random.randint(1, 1000)}M",
+                'revenue': f'${random.randint(1, 1000)}M',
                 'headquarters': fake.city(),
             },
             'products': [
@@ -46,41 +46,41 @@ class TestDataGenerator:
                 'ceo': fake.name(),
                 'cto': fake.name(),
                 'cfo': fake.name(),
-            }
+            },
         }
 
     @staticmethod
     def generate_conversation(turns: int = 3) -> str:
         """Generate a realistic conversation."""
         topics = [
-            "product features",
-            "pricing",
-            "technical support",
-            "integration",
-            "documentation",
-            "performance",
+            'product features',
+            'pricing',
+            'technical support',
+            'integration',
+            'documentation',
+            'performance',
         ]
 
         conversation = []
         for _ in range(turns):
             topic = random.choice(topics)
-            user_msg = f"user: {fake.sentence()} about {topic}?"
-            assistant_msg = f"assistant: {fake.paragraph(nb_sentences=2)}"
+            user_msg = f'user: {fake.sentence()} about {topic}?'
+            assistant_msg = f'assistant: {fake.paragraph(nb_sentences=2)}'
             conversation.extend([user_msg, assistant_msg])
 
-        return "\n".join(conversation)
+        return '\n'.join(conversation)
 
     @staticmethod
     def generate_technical_document() -> str:
         """Generate technical documentation content."""
         sections = [
-            f"# {fake.catch_phrase()}\n\n{fake.paragraph()}",
-            f"## Architecture\n{fake.paragraph()}",
-            f"## Implementation\n{fake.paragraph()}",
-            f"## Performance\n- Latency: {random.randint(1, 100)}ms\n- Throughput: {random.randint(100, 10000)} req/s",
-            f"## Dependencies\n- {fake.word()}\n- {fake.word()}\n- {fake.word()}",
+            f'# {fake.catch_phrase()}\n\n{fake.paragraph()}',
+            f'## Architecture\n{fake.paragraph()}',
+            f'## Implementation\n{fake.paragraph()}',
+            f'## Performance\n- Latency: {random.randint(1, 100)}ms\n- Throughput: {random.randint(100, 10000)} req/s',
+            f'## Dependencies\n- {fake.word()}\n- {fake.word()}\n- {fake.word()}',
         ]
-        return "\n\n".join(sections)
+        return '\n\n'.join(sections)
 
     @staticmethod
     def generate_news_article() -> str:
@@ -100,7 +100,7 @@ class TestDataGenerator:
         """
 
     @staticmethod
-    def generate_user_profile() -> Dict[str, Any]:
+    def generate_user_profile() -> dict[str, Any]:
         """Generate a user profile."""
         return {
             'user_id': fake.uuid4(),
@@ -115,8 +115,8 @@ class TestDataGenerator:
             'activity': {
                 'last_login': fake.date_time_this_month().isoformat(),
                 'total_sessions': random.randint(1, 1000),
-                'average_duration': f"{random.randint(1, 60)} minutes",
-            }
+                'average_duration': f'{random.randint(1, 60)} minutes',
+            },
         }
 
 
@@ -131,25 +131,27 @@ class MockLLMProvider:
         await asyncio.sleep(self.delay)
 
         # Return deterministic responses based on prompt patterns
-        if "extract entities" in prompt.lower():
-            return json.dumps({
-                'entities': [
-                    {'name': 'TestEntity1', 'type': 'PERSON'},
-                    {'name': 'TestEntity2', 'type': 'ORGANIZATION'},
-                ]
-            })
-        elif "summarize" in prompt.lower():
-            return "This is a test summary of the provided content."
+        if 'extract entities' in prompt.lower():
+            return json.dumps(
+                {
+                    'entities': [
+                        {'name': 'TestEntity1', 'type': 'PERSON'},
+                        {'name': 'TestEntity2', 'type': 'ORGANIZATION'},
+                    ]
+                }
+            )
+        elif 'summarize' in prompt.lower():
+            return 'This is a test summary of the provided content.'
         else:
-            return "Mock LLM response"
+            return 'Mock LLM response'
 
 
 @asynccontextmanager
 async def graphiti_test_client(
-    group_id: Optional[str] = None,
-    database: str = "kuzu",
+    group_id: str | None = None,
+    database: str = 'kuzu',
     use_mock_llm: bool = False,
-    config_overrides: Optional[Dict[str, Any]] = None
+    config_overrides: dict[str, Any] | None = None,
 ):
     """
     Context manager for creating test clients with various configurations.
@@ -169,11 +171,13 @@ async def graphiti_test_client(
 
     # Database-specific configuration
     if database == 'neo4j':
-        env.update({
-            'NEO4J_URI': os.environ.get('NEO4J_URI', 'bolt://localhost:7687'),
-            'NEO4J_USER': os.environ.get('NEO4J_USER', 'neo4j'),
-            'NEO4J_PASSWORD': os.environ.get('NEO4J_PASSWORD', 'graphiti'),
-        })
+        env.update(
+            {
+                'NEO4J_URI': os.environ.get('NEO4J_URI', 'bolt://localhost:7687'),
+                'NEO4J_USER': os.environ.get('NEO4J_USER', 'neo4j'),
+                'NEO4J_PASSWORD': os.environ.get('NEO4J_PASSWORD', 'graphiti'),
+            }
+        )
     elif database == 'falkordb':
         env['FALKORDB_URI'] = os.environ.get('FALKORDB_URI', 'redis://localhost:6379')
     elif database == 'kuzu':
@@ -188,9 +192,7 @@ async def graphiti_test_client(
         env['USE_MOCK_LLM'] = 'true'
 
     server_params = StdioServerParameters(
-        command='uv',
-        args=['run', 'main.py', '--transport', 'stdio'],
-        env=env
+        command='uv', args=['run', 'main.py', '--transport', 'stdio'], env=env
     )
 
     async with stdio_client(server_params) as (read, write):
@@ -203,7 +205,7 @@ async def graphiti_test_client(
             # Cleanup: Clear test data
             try:
                 await session.call_tool('clear_graph', {'group_id': test_group_id})
-            except:
+            except Exception:
                 pass  # Ignore cleanup errors
 
             await session.close()
@@ -213,7 +215,7 @@ class PerformanceBenchmark:
     """Track and analyze performance benchmarks."""
 
     def __init__(self):
-        self.measurements: Dict[str, List[float]] = {}
+        self.measurements: dict[str, list[float]] = {}
 
     def record(self, operation: str, duration: float):
         """Record a performance measurement."""
@@ -221,7 +223,7 @@ class PerformanceBenchmark:
             self.measurements[operation] = []
         self.measurements[operation].append(duration)
 
-    def get_stats(self, operation: str) -> Dict[str, float]:
+    def get_stats(self, operation: str) -> dict[str, float]:
         """Get statistics for an operation."""
         if operation not in self.measurements or not self.measurements[operation]:
             return {}
@@ -237,18 +239,18 @@ class PerformanceBenchmark:
 
     def report(self) -> str:
         """Generate a performance report."""
-        lines = ["Performance Benchmark Report", "=" * 40]
+        lines = ['Performance Benchmark Report', '=' * 40]
 
         for operation in sorted(self.measurements.keys()):
             stats = self.get_stats(operation)
-            lines.append(f"\n{operation}:")
-            lines.append(f"  Samples: {stats['count']}")
-            lines.append(f"  Mean: {stats['mean']:.3f}s")
-            lines.append(f"  Median: {stats['median']:.3f}s")
-            lines.append(f"  Min: {stats['min']:.3f}s")
-            lines.append(f"  Max: {stats['max']:.3f}s")
+            lines.append(f'\n{operation}:')
+            lines.append(f'  Samples: {stats["count"]}')
+            lines.append(f'  Mean: {stats["mean"]:.3f}s')
+            lines.append(f'  Median: {stats["median"]:.3f}s')
+            lines.append(f'  Min: {stats["min"]:.3f}s')
+            lines.append(f'  Max: {stats["max"]:.3f}s')
 
-        return "\n".join(lines)
+        return '\n'.join(lines)
 
 
 # Pytest fixtures
@@ -321,4 +323,4 @@ def large_dataset():
             'source_description': 'bulk import',
         }
         for i in range(50)
-    ]
\ No newline at end of file
+    ]
diff --git a/mcp_server/tests/test_stress_load.py b/mcp_server/tests/test_stress_load.py
index 0ffa6349..33517680 100644
--- a/mcp_server/tests/test_stress_load.py
+++ b/mcp_server/tests/test_stress_load.py
@@ -6,16 +6,13 @@ Tests system behavior under high load, resource constraints, and edge conditions
 
 import asyncio
 import gc
-import json
-import os
-import psutil
 import random
 import time
 from dataclasses import dataclass
-from typing import Dict, List, Optional, Tuple
 
+import psutil
 import pytest
-from test_fixtures import TestDataGenerator, graphiti_test_client, PerformanceBenchmark
+from test_fixtures import TestDataGenerator, graphiti_test_client
 
 
 @dataclass
@@ -26,7 +23,7 @@ class LoadTestConfig:
     operations_per_client: int = 100
     ramp_up_time: float = 5.0  # seconds
     test_duration: float = 60.0  # seconds
-    target_throughput: Optional[float] = None  # ops/sec
+    target_throughput: float | None = None  # ops/sec
     think_time: float = 0.1  # seconds between ops
 
 
@@ -44,8 +41,8 @@ class LoadTestResult:
     p95_latency: float
     p99_latency: float
     max_latency: float
-    errors: Dict[str, int]
-    resource_usage: Dict[str, float]
+    errors: dict[str, int]
+    resource_usage: dict[str, float]
 
 
 class LoadTester:
@@ -53,16 +50,11 @@ class LoadTester:
 
     def __init__(self, config: LoadTestConfig):
         self.config = config
-        self.metrics: List[Tuple[float, float, bool]] = []  # (start, duration, success)
-        self.errors: Dict[str, int] = {}
-        self.start_time: Optional[float] = None
+        self.metrics: list[tuple[float, float, bool]] = []  # (start, duration, success)
+        self.errors: dict[str, int] = {}
+        self.start_time: float | None = None
 
-    async def run_client_workload(
-        self,
-        client_id: int,
-        session,
-        group_id: str
-    ) -> Dict[str, int]:
+    async def run_client_workload(self, client_id: int, session, group_id: str) -> dict[str, int]:
         """Run workload for a single simulated client."""
         stats = {'success': 0, 'failure': 0}
         data_gen = TestDataGenerator()
@@ -76,11 +68,13 @@ class LoadTester:
 
             try:
                 # Randomly select operation type
-                operation = random.choice([
-                    'add_memory',
-                    'search_memory_nodes',
-                    'get_episodes',
-                ])
+                operation = random.choice(
+                    [
+                        'add_memory',
+                        'search_memory_nodes',
+                        'get_episodes',
+                    ]
+                )
 
                 if operation == 'add_memory':
                     args = {
@@ -103,10 +97,7 @@ class LoadTester:
                     }
 
                 # Execute operation with timeout
-                result = await asyncio.wait_for(
-                    session.call_tool(operation, args),
-                    timeout=30.0
-                )
+                await asyncio.wait_for(session.call_tool(operation, args), timeout=30.0)
 
                 duration = time.time() - operation_start
                 self.metrics.append((operation_start, duration, True))
@@ -146,7 +137,7 @@ class LoadTester:
         duration = max([m[0] + m[1] for m in self.metrics]) - min([m[0] for m in self.metrics])
 
         # Calculate percentiles
-        def percentile(data: List[float], p: float) -> float:
+        def percentile(data: list[float], p: float) -> float:
             if not data:
                 return 0.0
             idx = int(len(data) * p / 100)
@@ -209,16 +200,20 @@ class TestLoadScenarios:
 
             # Assertions
             assert results.successful_operations > results.failed_operations
-            assert results.average_latency < 5.0, f"Average latency too high: {results.average_latency:.2f}s"
-            assert results.p95_latency < 10.0, f"P95 latency too high: {results.p95_latency:.2f}s"
+            assert results.average_latency < 5.0, (
+                f'Average latency too high: {results.average_latency:.2f}s'
+            )
+            assert results.p95_latency < 10.0, f'P95 latency too high: {results.p95_latency:.2f}s'
 
             # Report results
-            print(f"\nSustained Load Test Results:")
-            print(f"  Total operations: {results.total_operations}")
-            print(f"  Success rate: {results.successful_operations / results.total_operations * 100:.1f}%")
-            print(f"  Throughput: {results.throughput:.2f} ops/s")
-            print(f"  Avg latency: {results.average_latency:.2f}s")
-            print(f"  P95 latency: {results.p95_latency:.2f}s")
+            print('\nSustained Load Test Results:')
+            print(f'  Total operations: {results.total_operations}')
+            print(
+                f'  Success rate: {results.successful_operations / results.total_operations * 100:.1f}%'
+            )
+            print(f'  Throughput: {results.throughput:.2f} ops/s')
+            print(f'  Avg latency: {results.average_latency:.2f}s')
+            print(f'  P95 latency: {results.p95_latency:.2f}s')
 
     @pytest.mark.asyncio
     @pytest.mark.slow
@@ -236,7 +231,7 @@ class TestLoadScenarios:
                         'source': 'text',
                         'source_description': 'normal',
                         'group_id': group_id,
-                    }
+                    },
                 )
                 normal_tasks.append(task)
                 await asyncio.sleep(0.5)
@@ -255,7 +250,7 @@ class TestLoadScenarios:
                         'source': 'text',
                         'source_description': 'spike',
                         'group_id': group_id,
-                    }
+                    },
                 )
                 spike_tasks.append(task)
 
@@ -267,14 +262,14 @@ class TestLoadScenarios:
             spike_failures = sum(1 for r in spike_results if isinstance(r, Exception))
             spike_success_rate = (len(spike_results) - spike_failures) / len(spike_results)
 
-            print(f"\nSpike Load Test Results:")
-            print(f"  Spike size: {len(spike_tasks)} operations")
-            print(f"  Duration: {spike_duration:.2f}s")
-            print(f"  Success rate: {spike_success_rate * 100:.1f}%")
-            print(f"  Throughput: {len(spike_tasks) / spike_duration:.2f} ops/s")
+            print('\nSpike Load Test Results:')
+            print(f'  Spike size: {len(spike_tasks)} operations')
+            print(f'  Duration: {spike_duration:.2f}s')
+            print(f'  Success rate: {spike_success_rate * 100:.1f}%')
+            print(f'  Throughput: {len(spike_tasks) / spike_duration:.2f} ops/s')
 
             # System should handle at least 80% of spike
-            assert spike_success_rate > 0.8, f"Too many failures during spike: {spike_failures}"
+            assert spike_success_rate > 0.8, f'Too many failures during spike: {spike_failures}'
 
     @pytest.mark.asyncio
     @pytest.mark.slow
@@ -297,7 +292,7 @@ class TestLoadScenarios:
                             'source': 'text',
                             'source_description': 'memory test',
                             'group_id': group_id,
-                        }
+                        },
                     )
                     batch_tasks.append(task)
 
@@ -312,15 +307,15 @@ class TestLoadScenarios:
             final_memory = process.memory_info().rss / 1024 / 1024  # MB
             memory_growth = final_memory - initial_memory
 
-            print(f"\nMemory Leak Test:")
-            print(f"  Initial memory: {initial_memory:.1f} MB")
-            print(f"  Final memory: {final_memory:.1f} MB")
-            print(f"  Growth: {memory_growth:.1f} MB")
+            print('\nMemory Leak Test:')
+            print(f'  Initial memory: {initial_memory:.1f} MB')
+            print(f'  Final memory: {final_memory:.1f} MB')
+            print(f'  Growth: {memory_growth:.1f} MB')
 
             # Allow for some memory growth but flag potential leaks
             # This is a soft check - actual threshold depends on system
             if memory_growth > 100:  # More than 100MB growth
-                print(f"  ⚠️  Potential memory leak detected: {memory_growth:.1f} MB growth")
+                print(f'  ⚠️  Potential memory leak detected: {memory_growth:.1f} MB growth')
 
     @pytest.mark.asyncio
     @pytest.mark.slow
@@ -333,32 +328,33 @@ class TestLoadScenarios:
                 task = session.call_tool(
                     'search_memory_nodes',
                     {
-                        'query': f'complex query {i} ' + ' '.join([TestDataGenerator.fake.word() for _ in range(10)]),
+                        'query': f'complex query {i} '
+                        + ' '.join([TestDataGenerator.fake.word() for _ in range(10)]),
                         'group_id': group_id,
                         'limit': 100,
-                    }
+                    },
                 )
                 long_tasks.append(task)
 
             # Execute with timeout
             try:
                 results = await asyncio.wait_for(
-                    asyncio.gather(*long_tasks, return_exceptions=True),
-                    timeout=60.0
+                    asyncio.gather(*long_tasks, return_exceptions=True), timeout=60.0
                 )
 
                 # Count connection-related errors
                 connection_errors = sum(
-                    1 for r in results
+                    1
+                    for r in results
                     if isinstance(r, Exception) and 'connection' in str(r).lower()
                 )
 
-                print(f"\nConnection Pool Test:")
-                print(f"  Total requests: {len(long_tasks)}")
-                print(f"  Connection errors: {connection_errors}")
+                print('\nConnection Pool Test:')
+                print(f'  Total requests: {len(long_tasks)}')
+                print(f'  Connection errors: {connection_errors}')
 
             except asyncio.TimeoutError:
-                print("  Test timed out - possible deadlock or exhaustion")
+                print('  Test timed out - possible deadlock or exhaustion')
 
     @pytest.mark.asyncio
     @pytest.mark.slow
@@ -381,7 +377,7 @@ class TestLoadScenarios:
                             'source': 'text',
                             'source_description': 'degradation test',
                             'group_id': group_id,
-                        }
+                        },
                     )
                     tasks.append(task)
 
@@ -400,10 +396,10 @@ class TestLoadScenarios:
                     'duration': level_duration,
                 }
 
-                print(f"\nLoad Level {level}:")
-                print(f"  Success rate: {success_rate:.1f}%")
-                print(f"  Throughput: {throughput:.2f} ops/s")
-                print(f"  Duration: {level_duration:.2f}s")
+                print(f'\nLoad Level {level}:')
+                print(f'  Success rate: {success_rate:.1f}%')
+                print(f'  Throughput: {throughput:.2f} ops/s')
+                print(f'  Duration: {level_duration:.2f}s')
 
                 # Brief pause between levels
                 await asyncio.sleep(2)
@@ -411,7 +407,7 @@ class TestLoadScenarios:
             # Verify graceful degradation
             # Success rate should not drop below 50% even at high load
             for level, metrics in results_by_level.items():
-                assert metrics['success_rate'] > 50, f"Poor performance at load level {level}"
+                assert metrics['success_rate'] > 50, f'Poor performance at load level {level}'
 
 
 class TestResourceLimits:
@@ -422,18 +418,18 @@ class TestResourceLimits:
         """Test handling of very large payloads."""
         async with graphiti_test_client() as (session, group_id):
             payload_sizes = [
-                (1_000, "1KB"),
-                (10_000, "10KB"),
-                (100_000, "100KB"),
-                (1_000_000, "1MB"),
+                (1_000, '1KB'),
+                (10_000, '10KB'),
+                (100_000, '100KB'),
+                (1_000_000, '1MB'),
             ]
 
             for size, label in payload_sizes:
-                content = "x" * size
+                content = 'x' * size
 
                 start_time = time.time()
                 try:
-                    result = await asyncio.wait_for(
+                    await asyncio.wait_for(
                         session.call_tool(
                             'add_memory',
                             {
@@ -442,22 +438,22 @@ class TestResourceLimits:
                                 'source': 'text',
                                 'source_description': 'payload test',
                                 'group_id': group_id,
-                            }
+                            },
                         ),
-                        timeout=30.0
+                        timeout=30.0,
                     )
                     duration = time.time() - start_time
-                    status = "✅ Success"
+                    status = '✅ Success'
 
                 except asyncio.TimeoutError:
                     duration = 30.0
-                    status = "⏱️  Timeout"
+                    status = '⏱️  Timeout'
 
                 except Exception as e:
                     duration = time.time() - start_time
-                    status = f"❌ Error: {type(e).__name__}"
+                    status = f'❌ Error: {type(e).__name__}'
 
-                print(f"Payload {label}: {status} ({duration:.2f}s)")
+                print(f'Payload {label}: {status} ({duration:.2f}s)')
 
     @pytest.mark.asyncio
     async def test_rate_limit_handling(self):
@@ -474,7 +470,7 @@ class TestResourceLimits:
                         'source': 'text',
                         'source_description': 'rate test',
                         'group_id': group_id,
-                    }
+                    },
                 )
                 rapid_tasks.append(task)
 
@@ -483,42 +479,49 @@ class TestResourceLimits:
 
             # Count rate limit errors
             rate_limit_errors = sum(
-                1 for r in results
+                1
+                for r in results
                 if isinstance(r, Exception) and ('rate' in str(r).lower() or '429' in str(r))
             )
 
-            print(f"\nRate Limit Test:")
-            print(f"  Total requests: {len(rapid_tasks)}")
-            print(f"  Rate limit errors: {rate_limit_errors}")
-            print(f"  Success rate: {(len(rapid_tasks) - rate_limit_errors) / len(rapid_tasks) * 100:.1f}%")
+            print('\nRate Limit Test:')
+            print(f'  Total requests: {len(rapid_tasks)}')
+            print(f'  Rate limit errors: {rate_limit_errors}')
+            print(
+                f'  Success rate: {(len(rapid_tasks) - rate_limit_errors) / len(rapid_tasks) * 100:.1f}%'
+            )
 
 
-def generate_load_test_report(results: List[LoadTestResult]) -> str:
+def generate_load_test_report(results: list[LoadTestResult]) -> str:
     """Generate comprehensive load test report."""
     report = []
-    report.append("\n" + "=" * 60)
-    report.append("LOAD TEST REPORT")
-    report.append("=" * 60)
+    report.append('\n' + '=' * 60)
+    report.append('LOAD TEST REPORT')
+    report.append('=' * 60)
 
     for i, result in enumerate(results):
-        report.append(f"\nTest Run {i + 1}:")
-        report.append(f"  Total Operations: {result.total_operations}")
-        report.append(f"  Success Rate: {result.successful_operations / result.total_operations * 100:.1f}%")
-        report.append(f"  Throughput: {result.throughput:.2f} ops/s")
-        report.append(f"  Latency (avg/p50/p95/p99/max): {result.average_latency:.2f}/{result.p50_latency:.2f}/{result.p95_latency:.2f}/{result.p99_latency:.2f}/{result.max_latency:.2f}s")
+        report.append(f'\nTest Run {i + 1}:')
+        report.append(f'  Total Operations: {result.total_operations}')
+        report.append(
+            f'  Success Rate: {result.successful_operations / result.total_operations * 100:.1f}%'
+        )
+        report.append(f'  Throughput: {result.throughput:.2f} ops/s')
+        report.append(
+            f'  Latency (avg/p50/p95/p99/max): {result.average_latency:.2f}/{result.p50_latency:.2f}/{result.p95_latency:.2f}/{result.p99_latency:.2f}/{result.max_latency:.2f}s'
+        )
 
         if result.errors:
-            report.append("  Errors:")
+            report.append('  Errors:')
             for error_type, count in result.errors.items():
-                report.append(f"    {error_type}: {count}")
+                report.append(f'    {error_type}: {count}')
 
-        report.append("  Resource Usage:")
+        report.append('  Resource Usage:')
         for metric, value in result.resource_usage.items():
-            report.append(f"    {metric}: {value:.2f}")
+            report.append(f'    {metric}: {value:.2f}')
 
-    report.append("=" * 60)
-    return "\n".join(report)
+    report.append('=' * 60)
+    return '\n'.join(report)
 
 
-if __name__ == "__main__":
-    pytest.main([__file__, "-v", "--asyncio-mode=auto", "-m", "slow"])
\ No newline at end of file
+if __name__ == '__main__':
+    pytest.main([__file__, '-v', '--asyncio-mode=auto', '-m', 'slow'])
diff --git a/mcp_server/uv.lock b/mcp_server/uv.lock
index 6222969b..65c91af3 100644
--- a/mcp_server/uv.lock
+++ b/mcp_server/uv.lock
@@ -635,7 +635,7 @@ wheels = [
 
 [[package]]
 name = "graphiti-core"
-version = "0.22.0"
+version = "0.22.1rc2"
 source = { editable = "../" }
 dependencies = [
     { name = "diskcache" },