LightRAG/lightrag/api/run_with_gunicorn.py
clssck 69358d830d test(lightrag,examples,api): comprehensive ruff formatting and type hints
Format entire codebase with ruff and add type hints across all modules:
- Apply ruff formatting to all Python files (121 files, 17K insertions)
- Add type hints to function signatures throughout lightrag core and API
- Update test suite with improved type annotations and docstrings
- Add pyrightconfig.json for static type checking configuration
- Create prompt_optimized.py and test_extraction_prompt_ab.py test files
- Update ruff.toml and .gitignore for improved linting configuration
- Standardize code style across examples, reproduce scripts, and utilities
2025-12-05 15:17:06 +01:00

257 lines
9.6 KiB
Python

#!/usr/bin/env python
"""
Start LightRAG server with Gunicorn
"""
import argparse
import os
import platform
import sys
from typing import cast
import pipmaster as pm
from lightrag.api.config import global_args
from lightrag.api.utils_api import check_env_file, display_splash_screen
from lightrag.constants import (
DEFAULT_TIMEOUT,
DEFAULT_WOKERS,
)
from lightrag.kg.shared_storage import initialize_share_data
from lightrag.utils import get_env_value
def check_and_install_dependencies():
    """Make sure every package the Gunicorn launcher needs is installed.

    Each required package is queried through pipmaster (``pm``); a missing one is
    installed on the spot, with progress reported on stdout.
    """
    # Extend this tuple when the launcher gains further required packages.
    dependencies = ('gunicorn', 'tiktoken', 'psutil')

    for name in dependencies:
        if pm.is_installed(name):
            continue
        print(f'Installing {name}...')
        pm.install(name)
        print(f'{name} installed successfully')
# Gunicorn settings copied from ``gunicorn_config`` when they hold a non-callable,
# non-None value.
_GUNICORN_VALID_OPTIONS = frozenset(
    {
        'bind',
        'workers',
        'worker_class',
        'timeout',
        'keepalive',
        'preload_app',
        'errorlog',
        'accesslog',
        'loglevel',
        'certfile',
        'keyfile',
        'limit_request_line',
        'limit_request_fields',
        'limit_request_field_size',
        'graceful_timeout',
        'max_requests',
        'max_requests_jitter',
    }
)

# Gunicorn server hooks; forwarded only when ``gunicorn_config`` defines them as callables.
_GUNICORN_SPECIAL_HOOKS = frozenset(
    {
        'on_starting',
        'on_reload',
        'on_exit',
        'pre_fork',
        'post_fork',
        'pre_exec',
        'pre_request',
        'post_request',
        'worker_init',
        'worker_exit',
        'nworkers_changed',
        'child_exit',
    }
)


def _exit_if_docling_multiworker_on_macos() -> None:
    """Exit with status 1 when DOCLING is combined with multiple workers on macOS.

    The check fires only when the platform is Darwin, the document loading engine is
    ``DOCLING`` and more than one worker is configured. An explanation and possible
    fixes are printed to stdout before exiting.
    """
    if platform.system() == 'Darwin' and global_args.document_loading_engine == 'DOCLING' and global_args.workers > 1:
        print('\n' + '=' * 80)
        print('❌ ERROR: Incompatible configuration detected!')
        print('=' * 80)
        print('\nDOCLING engine with Gunicorn multi-worker mode is not supported on macOS')
        print('\nReason:')
        print(' PyTorch (required by DOCLING) has known compatibility issues with')
        print(' fork-based multiprocessing on macOS, which can cause crashes or')
        print(' unexpected behavior when using Gunicorn with multiple workers.')
        print('\nCurrent configuration:')
        print(' - Operating System: macOS (Darwin)')
        print(f' - Document Engine: {global_args.document_loading_engine}')
        print(f' - Workers: {global_args.workers}')
        print('\nPossible solutions:')
        print(' 1. Use single worker mode:')
        print(' --workers 1')
        print('\n 2. Change document loading engine in .env:')
        print(' DOCUMENT_LOADING_ENGINE=DEFAULT')
        print('\n 3. Deploy on Linux where multi-worker mode is fully supported')
        print('=' * 80 + '\n')
        sys.exit(1)


def _exit_if_fork_safety_unset_on_macos() -> None:
    """Exit with status 1 when multi-worker mode on macOS lacks the fork-safety override.

    The check fires only when the platform is Darwin, more than one worker is
    configured and ``OBJC_DISABLE_INITIALIZE_FORK_SAFETY`` is not exactly ``YES``.
    An explanation and fix instructions are printed to stdout before exiting.
    """
    if (
        platform.system() == 'Darwin'
        and global_args.workers > 1
        and os.environ.get('OBJC_DISABLE_INITIALIZE_FORK_SAFETY') != 'YES'
    ):
        print('\n' + '=' * 80)
        print('❌ ERROR: Missing required environment variable on macOS!')
        print('=' * 80)
        print('\nmacOS with Gunicorn multi-worker mode requires:')
        print(' OBJC_DISABLE_INITIALIZE_FORK_SAFETY=YES')
        print('\nReason:')
        print(" NumPy uses macOS's Accelerate framework (Objective-C based) for")
        print(' vector computations. The Objective-C runtime has fork safety checks')
        print(' that will crash worker processes when embedding functions are called.')
        print('\nCurrent configuration:')
        print(' - Operating System: macOS (Darwin)')
        print(f' - Workers: {global_args.workers}')
        print(f' - Environment Variable: {os.environ.get("OBJC_DISABLE_INITIALIZE_FORK_SAFETY", "NOT SET")}')
        print('\nHow to fix:')
        print(' Option 1 - Set environment variable before starting (recommended):')
        print(' export OBJC_DISABLE_INITIALIZE_FORK_SAFETY=YES')
        print(' lightrag-gunicorn --workers 2')
        print('\n Option 2 - Add to your shell profile (~/.zshrc or ~/.bash_profile):')
        print(" echo 'export OBJC_DISABLE_INITIALIZE_FORK_SAFETY=YES' >> ~/.zshrc")
        print(' source ~/.zshrc')
        print('\n Option 3 - Use single worker mode (no multiprocessing):')
        print(' lightrag-server --workers 1')
        print('=' * 80 + '\n')
        sys.exit(1)


def _print_startup_banner() -> None:
    """Show the splash screen followed by the Gunicorn / main-process summary on stdout."""
    display_splash_screen(cast(argparse.Namespace, global_args))

    print('🚀 Starting LightRAG with Gunicorn')
    print(f'🔄 Worker management: Gunicorn (workers={global_args.workers})')
    print('🔍 Preloading app: Enabled')
    print("📝 Note: Using Gunicorn's preload feature for shared data initialization")

    print('\n\n' + '=' * 80)
    print('MAIN PROCESS INITIALIZATION')
    print(f'Process ID: {os.getpid()}')
    print(f'Workers setting: {global_args.workers}')
    print('=' * 80 + '\n')


def _apply_gunicorn_settings(cfg) -> None:
    """Write the effective runtime settings into ``gunicorn_config`` and copy them to *cfg*.

    Values carried by ``global_args`` take priority; environment variables are the
    fallback. After the module attributes are updated, every recognised option and
    server hook found on ``gunicorn_config`` is forwarded through ``cfg.set``.

    Args:
        cfg: The Gunicorn configuration object of the running application
            (``BaseApplication.cfg``); only its ``set(key, value)`` method is used.
    """
    from lightrag.api import gunicorn_config

    # Worker count: a falsy value in global_args defers to the WORKERS env variable.
    gunicorn_config.workers = global_args.workers or get_env_value('WORKERS', DEFAULT_WOKERS, int)

    # Bind address: a host of '0.0.0.0' / port of 9621 is treated as "left at default",
    # in which case the HOST / PORT environment variables are consulted.
    host = global_args.host if global_args.host != '0.0.0.0' else os.getenv('HOST', '0.0.0.0')
    port = global_args.port if global_args.port != 9621 else get_env_value('PORT', 9621, int)
    gunicorn_config.bind = f'{host}:{port}'

    gunicorn_config.loglevel = (
        global_args.log_level.lower() if global_args.log_level else os.getenv('LOG_LEVEL', 'info')
    )

    # Gunicorn's timeout is the configured timeout plus 30 seconds. Without a configured
    # timeout, TIMEOUT from the environment is used, defaulting to DEFAULT_TIMEOUT + 30.
    gunicorn_config.timeout = (
        global_args.timeout + 30
        if global_args.timeout is not None
        else get_env_value('TIMEOUT', DEFAULT_TIMEOUT + 30, int, special_none=True)
    )

    gunicorn_config.keepalive = get_env_value('KEEPALIVE', 5, int)

    # SSL is enabled either by global_args.ssl or by a truthy SSL environment variable.
    if global_args.ssl or os.getenv('SSL', '').lower() in ('true', '1', 'yes', 't', 'on'):
        gunicorn_config.certfile = global_args.ssl_certfile or os.getenv('SSL_CERTFILE')
        gunicorn_config.keyfile = global_args.ssl_keyfile or os.getenv('SSL_KEYFILE')

    for key in dir(gunicorn_config):
        if key in _GUNICORN_VALID_OPTIONS:
            value = getattr(gunicorn_config, key)
            # Plain options: skip callables and unset (None) values.
            if not callable(value) and value is not None:
                cfg.set(key, value)
        elif key in _GUNICORN_SPECIAL_HOOKS:
            value = getattr(gunicorn_config, key)
            # Hooks are only meaningful when they are callables.
            if callable(value):
                cfg.set(key, value)

    if hasattr(gunicorn_config, 'logconfig_dict'):
        cfg.set('logconfig_dict', gunicorn_config.logconfig_dict)


def _create_gunicorn_app():
    """Build the Gunicorn application object that serves the LightRAG API.

    Returns:
        An instance of a ``BaseApplication`` subclass whose configuration comes from
        ``_apply_gunicorn_settings`` and whose WSGI/ASGI app comes from
        ``lightrag.api.lightrag_server.get_application``.
    """
    # Imported lazily: main() runs check_and_install_dependencies() (which lists
    # 'gunicorn') before calling this function.
    from gunicorn.app.base import BaseApplication

    class GunicornApp(BaseApplication):
        """Gunicorn application configured programmatically instead of via a config file."""

        def __init__(self, app, options=None):
            self.options = options or {}
            self.application = app
            super().__init__()

        def load_config(self):
            _apply_gunicorn_settings(self.cfg)

        def load(self):
            # Deferred import so the server module is only loaded when Gunicorn asks for the app.
            from lightrag.api.lightrag_server import get_application

            return get_application(global_args)

    return GunicornApp('')


def main() -> None:
    """Start the LightRAG API server under Gunicorn.

    Steps, in order: initialise configuration, flag Gunicorn mode in the environment,
    validate the ``.env`` file, run the macOS pre-flight checks, install missing
    dependencies, print the startup banner, build the Gunicorn application,
    initialise shared data for the configured worker count and finally run Gunicorn.

    Exits the process with status 1 when the ``.env`` check or one of the macOS
    pre-flight checks fails.
    """
    # Explicitly initialize configuration for Gunicorn mode
    from lightrag.api.config import initialize_config

    initialize_config()

    # Set Gunicorn mode flag for lifespan cleanup detection
    os.environ['LIGHTRAG_GUNICORN_MODE'] = '1'

    if not check_env_file():
        sys.exit(1)

    _exit_if_docling_multiworker_on_macos()
    _exit_if_fork_safety_unset_on_macos()

    check_and_install_dependencies()

    # Note: Signal handlers are NOT registered here because master cleanup is
    # already handled by gunicorn_config.on_exit().
    _print_startup_banner()

    app = _create_gunicorn_app()

    # Shared data is sized for the real worker count in multi-worker mode and for a
    # single process otherwise.
    workers_count = global_args.workers
    if workers_count > 1:
        # Set a flag to indicate we're in the main process
        os.environ['LIGHTRAG_MAIN_PROCESS'] = '1'
        initialize_share_data(workers_count)
    else:
        initialize_share_data(1)

    print('\nStarting Gunicorn with direct Python API...')
    app.run()
# Start the server only when this file is executed as a script, not when it is imported.
if __name__ == '__main__':
    main()