Fix: Increase Ollama timeout values to prevent ReadTimeout errors

This commit is contained in:
eddiemaru-101 2025-05-30 22:43:52 +09:00
parent 36a736db0b
commit 77399e051f

View file

@@ -50,7 +50,7 @@ async def _ollama_model_if_cache(
kwargs.pop("max_tokens", None)
# kwargs.pop("response_format", None) # allow json
host = kwargs.pop("host", None)
-timeout = kwargs.pop("timeout", None) or 300 # Default timeout 300s
+timeout = kwargs.pop("timeout", None) or 600 # Default timeout 600s (10분으로 증가)
kwargs.pop("hashing_kv", None)
api_key = kwargs.pop("api_key", None)
headers = {
@@ -146,7 +146,7 @@ async def ollama_embed(texts: list[str], embed_model, **kwargs) -> np.ndarray:
headers["Authorization"] = f"Bearer {api_key}"
host = kwargs.pop("host", None)
-timeout = kwargs.pop("timeout", None) or 90 # Default time out 90s
+timeout = kwargs.pop("timeout", None) or 300 # Default time out 300s (5분으로 증가)
ollama_client = ollama.AsyncClient(host=host, timeout=timeout, headers=headers)
@@ -168,4 +168,4 @@ async def ollama_embed(texts: list[str], embed_model, **kwargs) -> np.ndarray:
await ollama_client._client.aclose()
logger.debug("Successfully closed Ollama client after embed")
except Exception as close_error:
-logger.warning(f"Failed to close Ollama client after embed: {close_error}")
+logger.warning(f"Failed to close Ollama client after embed: {close_error}")