Remove legacy storage implementations and deprecated examples: - Delete FAISS, JSON, Memgraph, Milvus, MongoDB, Nano Vector DB, Neo4j, NetworkX, Qdrant, Redis storage backends - Remove Kubernetes deployment manifests and installation scripts - Delete unofficial examples for deprecated backends and offline deployment docs Streamline core infrastructure: - Consolidate storage layer to PostgreSQL-only implementation - Add full-text search caching with FTS cache module - Implement metrics collection and monitoring pipeline - Add explain and metrics API routes Modernize frontend and tooling: - Switch web UI to Bun with bun.lock, remove npm and pnpm lockfiles - Update Dockerfile for PostgreSQL-only deployment - Add Makefile for common development tasks - Update environment and configuration examples Enhance evaluation and testing capabilities: - Add prompt optimization with DSPy and auto-tuning - Implement ground truth regeneration and variant testing - Add prompt debugging and response comparison utilities - Expand test coverage with new integration scenarios Simplify dependencies and configuration: - Remove offline-specific requirement files - Update pyproject.toml with streamlined dependencies - Add Python version pinning with .python-version - Create project guidelines in CLAUDE.md and AGENTS.md
122 lines
4.4 KiB
Python
122 lines
4.4 KiB
Python
from __future__ import annotations
|
|
|
|
from typing import Literal
|
|
|
|
import httpx
|
|
|
|
|
|
class APIStatusError(Exception):
|
|
"""Raised when an API response has a status code of 4xx or 5xx."""
|
|
|
|
response: httpx.Response
|
|
status_code: int
|
|
request_id: str | None
|
|
|
|
def __init__(self, message: str, *, response: httpx.Response, body: object | None = None) -> None:
|
|
super().__init__(message)
|
|
self.response = response
|
|
self.status_code = response.status_code
|
|
self.request_id = response.headers.get('x-request-id')
|
|
|
|
|
|
class APIConnectionError(Exception):
|
|
def __init__(self, *, message: str = 'Connection error.', request: httpx.Request) -> None:
|
|
super().__init__(message)
|
|
|
|
|
|
class BadRequestError(APIStatusError):
|
|
status_code: Literal[400] = 400 # pyright: ignore[reportIncompatibleVariableOverride]
|
|
|
|
|
|
class AuthenticationError(APIStatusError):
|
|
status_code: Literal[401] = 401 # pyright: ignore[reportIncompatibleVariableOverride]
|
|
|
|
|
|
class PermissionDeniedError(APIStatusError):
|
|
status_code: Literal[403] = 403 # pyright: ignore[reportIncompatibleVariableOverride]
|
|
|
|
|
|
class NotFoundError(APIStatusError):
|
|
status_code: Literal[404] = 404 # pyright: ignore[reportIncompatibleVariableOverride]
|
|
|
|
|
|
class ConflictError(APIStatusError):
|
|
status_code: Literal[409] = 409 # pyright: ignore[reportIncompatibleVariableOverride]
|
|
|
|
|
|
class UnprocessableEntityError(APIStatusError):
|
|
status_code: Literal[422] = 422 # pyright: ignore[reportIncompatibleVariableOverride]
|
|
|
|
|
|
class RateLimitError(APIStatusError):
|
|
status_code: Literal[429] = 429 # pyright: ignore[reportIncompatibleVariableOverride]
|
|
|
|
|
|
class APITimeoutError(APIConnectionError):
|
|
def __init__(self, request: httpx.Request) -> None:
|
|
super().__init__(message='Request timed out.', request=request)
|
|
|
|
|
|
class StorageNotInitializedError(RuntimeError):
|
|
"""Raised when storage operations are attempted before initialization."""
|
|
|
|
def __init__(self, storage_type: str = 'Storage'):
|
|
super().__init__(
|
|
f'{storage_type} not initialized. Please ensure proper initialization:\n'
|
|
f'\n'
|
|
f' rag = LightRAG(...)\n'
|
|
f' await rag.initialize_storages() # Required - auto-initializes pipeline_status\n'
|
|
f'\n'
|
|
f'See: https://github.com/HKUDS/LightRAG#important-initialization-requirements'
|
|
)
|
|
|
|
|
|
class PipelineNotInitializedError(KeyError):
|
|
"""Raised when pipeline status is accessed before initialization."""
|
|
|
|
def __init__(self, namespace: str = ''):
|
|
msg = (
|
|
f"Pipeline namespace '{namespace}' not found.\n"
|
|
f'\n'
|
|
f'Pipeline status should be auto-initialized by initialize_storages().\n'
|
|
f'If you see this error, please ensure:\n'
|
|
f'\n'
|
|
f' 1. You called await rag.initialize_storages()\n'
|
|
f' 2. For multi-workspace setups, each LightRAG instance was properly initialized\n'
|
|
f'\n'
|
|
f'Standard initialization:\n'
|
|
f" rag = LightRAG(workspace='your_workspace')\n"
|
|
f' await rag.initialize_storages() # Auto-initializes pipeline_status\n'
|
|
f'\n'
|
|
f'If you need manual control (advanced):\n'
|
|
f' from lightrag.kg.shared_storage import initialize_pipeline_status\n'
|
|
f" await initialize_pipeline_status(workspace='your_workspace')"
|
|
)
|
|
super().__init__(msg)
|
|
|
|
|
|
class PipelineCancelledException(Exception):
|
|
"""Raised when pipeline processing is cancelled by user request."""
|
|
|
|
def __init__(self, message: str = 'User cancelled'):
|
|
super().__init__(message)
|
|
self.message = message
|
|
|
|
|
|
class ChunkTokenLimitExceededError(ValueError):
|
|
"""Raised when a chunk exceeds the configured token limit."""
|
|
|
|
def __init__(
|
|
self,
|
|
chunk_tokens: int,
|
|
chunk_token_limit: int,
|
|
chunk_preview: str | None = None,
|
|
) -> None:
|
|
preview = chunk_preview.strip() if chunk_preview else None
|
|
truncated_preview = preview[:80] if preview else None
|
|
preview_note = f" Preview: '{truncated_preview}'" if truncated_preview else ''
|
|
message = f'Chunk token length {chunk_tokens} exceeds chunk_token_size {chunk_token_limit}.{preview_note}'
|
|
super().__init__(message)
|
|
self.chunk_tokens = chunk_tokens
|
|
self.chunk_token_limit = chunk_token_limit
|
|
self.chunk_preview = truncated_preview
|