chore: add AWS Bedrock support using boto3, geared primarily toward the Anthropic models provided by AWS
parent 56694a6dea
commit 82ff6fc696
2 changed files with 149 additions and 0 deletions
147 graphiti_core/llm_client/aws_bedrock_client.py Normal file
2 graphiti_core/llm_client/config.py

graphiti_core/llm_client/aws_bedrock_client.py
@@ -0,0 +1,147 @@
"""
Copyright 2024, Zep Software, Inc.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import json
import logging
from typing import ClassVar

import boto3
from pydantic import BaseModel

from .config import DEFAULT_MAX_TOKENS, LLMConfig
from .openai_base_client import BaseOpenAIClient

logger = logging.getLogger(__name__)


class BedrockAnthropicLLMClient(BaseOpenAIClient):
    MAX_RETRIES: ClassVar[int] = 2

    def __init__(
        self,
        config: LLMConfig | None = None,
        max_tokens: int = DEFAULT_MAX_TOKENS,
    ):
        super().__init__(config, cache=False, max_tokens=max_tokens)

        # Fall back to us-east-1 and Claude 3 Sonnet when no config is given.
        self.region = config.region if config and getattr(config, "region", None) else "us-east-1"
        self.model = config.model if config else "anthropic.claude-3-sonnet-20240229-v1:0"

        self.client = boto3.client("bedrock-runtime", region_name=self.region)

    async def _create_structured_completion(
        self,
        model: str,
        messages: list[dict],
        temperature: float | None,
        max_tokens: int,
        response_model: type[BaseModel],
    ):
        text_response = await self._invoke_bedrock_model(
            model=model,
            messages=messages,
            temperature=temperature,
            max_tokens=max_tokens,
            response_format="json",
        )

        try:
            return response_model.model_validate_json(text_response)
        except Exception as e:
            logger.error(f"Failed to parse structured Bedrock response: {e}")
            raise

    async def _create_completion(
        self,
        model: str,
        messages: list[dict],
        temperature: float | None,
        max_tokens: int,
        response_model: type[BaseModel] | None = None,
    ):
        text_response = await self._invoke_bedrock_model(
            model=model,
            messages=messages,
            temperature=temperature,
            max_tokens=max_tokens,
            response_format="text",
        )

        if response_model:
            try:
                return response_model.model_validate_json(text_response)
            except Exception as e:
                logger.error(f"Failed to parse Bedrock response to {response_model.__name__}: {e}")
                raise
        return text_response

    async def _invoke_bedrock_model(
        self,
        model: str,
        messages: list[dict],
        temperature: float | None = 0.7,
        max_tokens: int = 200,
        response_format: str = "text",
    ) -> str:
        # Bedrock's Anthropic API takes the system prompt as a top-level
        # field, so split it out from the conversation messages.
        system_prompt = None
        final_messages = []
        for m in messages:
            if m["role"] == "system":
                system_prompt = m["content"]
            else:
                final_messages.append(m)

        body_dict = {
            "messages": final_messages,
            "temperature": temperature,
            "max_tokens": max_tokens,
            "anthropic_version": "bedrock-2023-05-31",
        }

        if system_prompt:
            body_dict["system"] = system_prompt

        body = json.dumps(body_dict)

        try:
            # Note: boto3 is synchronous; this call blocks the event loop.
            resp = self.client.invoke_model(
                modelId=model,
                body=body,
                accept="application/json",
                contentType="application/json",
            )
            data = json.loads(resp["body"].read().decode("utf-8"))

            # Anthropic models return a "content" list; fall back to
            # "outputText" (Titan-style) or the raw payload otherwise.
            if "content" in data and len(data["content"]) > 0:
                text = data["content"][0].get("text", "")
            elif "outputText" in data:
                text = data["outputText"]
            else:
                text = json.dumps(data)

            # Ensure JSON-object-only output for structured calls by
            # stripping any markdown code fences the model emits.
            if response_format == "json":
                text = text.strip()
                if text.startswith("```json"):
                    text = text.replace("```json", "").replace("```", "").strip()
            return text.strip()

        except Exception as e:
            logger.error(f"Bedrock model invocation failed: {e}", exc_info=True)
            raise
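
For context, the request body that _invoke_bedrock_model assembles for an Anthropic model ends up looking like this (the message and system content are illustrative):

    body_dict = {
        "messages": [{"role": "user", "content": "Summarize this episode."}],
        "temperature": 0.7,
        "max_tokens": 200,
        "anthropic_version": "bedrock-2023-05-31",
        "system": "You are a helpful assistant.",  # only set when a system message was supplied
    }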

graphiti_core/llm_client/config.py
@@ -42,6 +42,7 @@ class LLMConfig:
        temperature: float = DEFAULT_TEMPERATURE,
        max_tokens: int = DEFAULT_MAX_TOKENS,
        small_model: str | None = None,
        region: str | None = None,
    ):
        """
        Initialize the LLMConfig with the provided parameters.
@@ -66,3 +67,4 @@ class LLMConfig:
        self.small_model = small_model
        self.temperature = temperature
        self.max_tokens = max_tokens
        self.region = region or "us-east-1"
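
For reference, a minimal usage sketch of the new client. It assumes AWS credentials are already configured for boto3; the LLMConfig keyword arguments shown are assumptions based on the fields this diff reads (config.model, config.region):

    from graphiti_core.llm_client.aws_bedrock_client import BedrockAnthropicLLMClient
    from graphiti_core.llm_client.config import LLMConfig

    # These values mirror the client's own fallback defaults.
    config = LLMConfig(model="anthropic.claude-3-sonnet-20240229-v1:0", region="us-east-1")
    client = BedrockAnthropicLLMClient(config=config)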