diff --git a/pyproject.toml b/pyproject.toml
index 765e815ef..745c80e0c 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -89,8 +89,14 @@ writer = [
     "writer-sdk>=2.2.0,<3.0.0"
 ]
 
+sagemaker = [
+    "boto3>=1.26.0,<2.0.0",
+    "botocore>=1.29.0,<2.0.0",
+    "boto3-stubs[sagemaker-runtime]>=1.26.0,<2.0.0"
+]
+
 a2a = [
-    "a2a-sdk[sql]>=0.2.16,<1.0.0",
+    "a2a-sdk[sql]>=0.2.11,<1.0.0",
     "uvicorn>=0.34.2,<1.0.0",
     "httpx>=0.28.1,<1.0.0",
     "fastapi>=0.115.12,<1.0.0",
@@ -136,7 +142,7 @@ all = [
     "opentelemetry-exporter-otlp-proto-http>=1.30.0,<2.0.0",
 
     # a2a
-    "a2a-sdk[sql]>=0.2.16,<1.0.0",
+    "a2a-sdk[sql]>=0.2.11,<1.0.0",
     "uvicorn>=0.34.2,<1.0.0",
     "httpx>=0.28.1,<1.0.0",
     "fastapi>=0.115.12,<1.0.0",
@@ -148,7 +154,7 @@ all = [
 source = "vcs"
 
 [tool.hatch.envs.hatch-static-analysis]
-features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel", "mistral", "writer", "a2a"]
+features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel", "mistral", "writer", "a2a", "sagemaker"]
 dependencies = [
   "mypy>=1.15.0,<2.0.0",
   "ruff>=0.11.6,<0.12.0",
@@ -171,7 +177,7 @@ lint-fix = [
 ]
 
 [tool.hatch.envs.hatch-test]
-features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel", "mistral", "writer", "a2a"]
+features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel", "mistral", "writer", "a2a", "sagemaker"]
 extra-dependencies = [
     "moto>=5.1.0,<6.0.0",
     "pytest>=8.0.0,<9.0.0",
@@ -187,7 +193,7 @@ extra-args = [
 
 [tool.hatch.envs.dev]
 dev-mode = true
-features = ["dev", "docs", "anthropic", "litellm", "llamaapi", "ollama", "otel", "mistral", "writer", "a2a"]
+features = ["dev", "docs", "anthropic", "litellm", "llamaapi", "ollama", "otel", "mistral", "writer", "a2a", "sagemaker"]
 
 [[tool.hatch.envs.hatch-test.matrix]]
 python = ["3.13", "3.12", "3.11", "3.10"]
@@ -315,4 +321,4 @@ style = [
     ["instruction", ""],
     ["text", ""],
     ["disabled", "fg:#858585 italic"]
-]
+]
\ No newline at end of file
diff --git a/src/strands/models/sagemaker.py b/src/strands/models/sagemaker.py
new file mode 100644
index 000000000..bb2db45a2
--- /dev/null
+++ b/src/strands/models/sagemaker.py
@@ -0,0 +1,600 @@
+"""Amazon SageMaker model provider."""
+
+import json
+import logging
+import os
+from dataclasses import dataclass
+from typing import Any, AsyncGenerator, Literal, Optional, Type, TypedDict, TypeVar, Union, cast
+
+import boto3
+from botocore.config import Config as BotocoreConfig
+from mypy_boto3_sagemaker_runtime import SageMakerRuntimeClient
+from pydantic import BaseModel
+from typing_extensions import Unpack, override
+
+from ..types.content import ContentBlock, Messages
+from ..types.streaming import StreamEvent
+from ..types.tools import ToolResult, ToolSpec
+from .openai import OpenAIModel
+
+T = TypeVar("T", bound=BaseModel)
+
+logger = logging.getLogger(__name__)
+
+
+@dataclass
+class UsageMetadata:
+    """Usage metadata for the model.
+
+    Attributes:
+        total_tokens: Total number of tokens used in the request
+        completion_tokens: Number of tokens used in the completion
+        prompt_tokens: Number of tokens used in the prompt
+        prompt_tokens_details: Additional information about the prompt tokens (optional)
+    """
+
+    total_tokens: int
+    completion_tokens: int
+    prompt_tokens: int
+    prompt_tokens_details: Optional[int] = 0
+
+
+@dataclass
+class FunctionCall:
+    """Function call for the model.
+
+    Attributes:
+        name: Name of the function to call
+        arguments: Arguments to pass to the function
+    """
+
+    name: Union[str, dict[Any, Any]]
+    arguments: Union[str, dict[Any, Any]]
+
+    def __init__(self, **kwargs: dict[str, str]):
+        """Initialize function call.
+
+        Args:
+            **kwargs: Keyword arguments for the function call.
+        """
+        self.name = kwargs.get("name", "")
+        self.arguments = kwargs.get("arguments", "")
+
+
+@dataclass
+class ToolCall:
+    """Tool call for the model object.
+
+    Attributes:
+        id: Tool call ID
+        type: Tool call type
+        function: Tool call function
+    """
+
+    id: str
+    type: Literal["function"]
+    function: FunctionCall
+
+    def __init__(self, **kwargs: dict):
+        """Initialize tool call object.
+
+        Args:
+            **kwargs: Keyword arguments for the tool call.
+        """
+        self.id = str(kwargs.get("id", ""))
+        self.type = "function"
+        self.function = FunctionCall(**kwargs.get("function", {"name": "", "arguments": ""}))
+
+
+class SageMakerAIModel(OpenAIModel):
+    """Amazon SageMaker model provider implementation."""
+
+    client: SageMakerRuntimeClient  # type: ignore[assignment]
+
+    class SageMakerAIPayloadSchema(TypedDict, total=False):
+        """Payload schema for the Amazon SageMaker AI model.
+
+        Attributes:
+            max_tokens: Maximum number of tokens to generate in the completion
+            stream: Whether to stream the response
+            temperature: Sampling temperature to use for the model (optional)
+            top_p: Nucleus sampling parameter (optional)
+            top_k: Top-k sampling parameter (optional)
+            stop: List of stop sequences to use for the model (optional)
+            tool_results_as_user_messages: Convert tool result to user messages (optional)
+            additional_args: Additional request parameters, as supported by https://bit.ly/djl-lmi-request-schema
+        """
+
+        max_tokens: int
+        stream: bool
+        temperature: Optional[float]
+        top_p: Optional[float]
+        top_k: Optional[int]
+        stop: Optional[list[str]]
+        tool_results_as_user_messages: Optional[bool]
+        additional_args: Optional[dict[str, Any]]
+
+    class SageMakerAIEndpointConfig(TypedDict, total=False):
+        """Configuration options for SageMaker models.
+
+        Attributes:
+            endpoint_name: The name of the SageMaker endpoint to invoke
+            inference_component_name: The name of the inference component to use
+
+            additional_args: Other request parameters, as supported by https://bit.ly/sagemaker-invoke-endpoint-params
+        """
+
+        endpoint_name: str
+        region_name: str
+        inference_component_name: Union[str, None]
+        target_model: Union[Optional[str], None]
+        target_variant: Union[Optional[str], None]
+        additional_args: Optional[dict[str, Any]]
+
+    def __init__(
+        self,
+        endpoint_config: SageMakerAIEndpointConfig,
+        payload_config: SageMakerAIPayloadSchema,
+        boto_session: Optional[boto3.Session] = None,
+        boto_client_config: Optional[BotocoreConfig] = None,
+    ):
+        """Initialize provider instance.
+
+        Args:
+            endpoint_config: Endpoint configuration for SageMaker.
+            payload_config: Payload configuration for the model.
+            boto_session: Boto Session to use when calling the SageMaker Runtime.
+            boto_client_config: Configuration to use when creating the SageMaker-Runtime Boto Client.
+        """
+        payload_config.setdefault("stream", True)
+        payload_config.setdefault("tool_results_as_user_messages", False)
+        self.endpoint_config = dict(endpoint_config)
+        self.payload_config = dict(payload_config)
+        logger.debug(
+            "endpoint_config=<%s> payload_config=<%s> | initializing", self.endpoint_config, self.payload_config
+        )
+
+        region = self.endpoint_config.get("region_name") or os.getenv("AWS_REGION") or "us-west-2"
+        session = boto_session or boto3.Session(region_name=str(region))
+
+        # Add strands-agents to the request user agent
+        if boto_client_config:
+            existing_user_agent = getattr(boto_client_config, "user_agent_extra", None)
+
+            # Append 'strands-agents' to existing user_agent_extra or set it if not present
+            new_user_agent = f"{existing_user_agent} strands-agents" if existing_user_agent else "strands-agents"
+
+            client_config = boto_client_config.merge(BotocoreConfig(user_agent_extra=new_user_agent))
+        else:
+            client_config = BotocoreConfig(user_agent_extra="strands-agents")
+
+        self.client = session.client(
+            service_name="sagemaker-runtime",
+            config=client_config,
+        )
+
+    @override
+    def update_config(self, **endpoint_config: Unpack[SageMakerAIEndpointConfig]) -> None:  # type: ignore[override]
+        """Update the Amazon SageMaker model configuration with the provided arguments.
+
+        Args:
+            **endpoint_config: Configuration overrides.
+        """
+        self.endpoint_config.update(endpoint_config)
+
+    @override
+    def get_config(self) -> "SageMakerAIModel.SageMakerAIEndpointConfig":  # type: ignore[override]
+        """Get the Amazon SageMaker model configuration.
+
+        Returns:
+            The Amazon SageMaker model configuration.
+        """
+        return cast(SageMakerAIModel.SageMakerAIEndpointConfig, self.endpoint_config)
+
+    @override
+    def format_request(
+        self, messages: Messages, tool_specs: Optional[list[ToolSpec]] = None, system_prompt: Optional[str] = None
+    ) -> dict[str, Any]:
+        """Format an Amazon SageMaker chat streaming request.
+
+        Args:
+            messages: List of message objects to be processed by the model.
+            tool_specs: List of tool specifications to make available to the model.
+            system_prompt: System prompt to provide context to the model.
+
+        Returns:
+            An Amazon SageMaker chat streaming request.
+        """
+        formatted_messages = self.format_request_messages(messages, system_prompt)
+
+        payload = {
+            "messages": formatted_messages,
+            "tools": [
+                {
+                    "type": "function",
+                    "function": {
+                        "name": tool_spec["name"],
+                        "description": tool_spec["description"],
+                        "parameters": tool_spec["inputSchema"]["json"],
+                    },
+                }
+                for tool_spec in tool_specs or []
+            ],
+            # Add payload configuration parameters
+            **{
+                k: v
+                for k, v in self.payload_config.items()
+                if k not in ["additional_args", "tool_results_as_user_messages"]
+            },
+        }
+
+        # Remove tools and tool_choice if tools = []
+        if not payload["tools"]:
+            payload.pop("tools")
+            payload.pop("tool_choice", None)
+        else:
+            # Ensure the model can use tools when available
+            payload["tool_choice"] = "auto"
+
+        for message in payload["messages"]:  # type: ignore
+            # Assistant message must have either content or tool_calls, but not both
+            if message.get("role", "") == "assistant" and message.get("tool_calls", []) != []:
+                message.pop("content", None)
+            if message.get("role") == "tool" and self.payload_config.get("tool_results_as_user_messages", False):
+                # Convert tool message to user message
+                tool_call_id = message.get("tool_call_id", "ABCDEF")
+                content = message.get("content", "")
+                message = {"role": "user", "content": f"Tool call ID '{tool_call_id}' returned: {content}"}
+            # Cannot have both reasoning_text and text - if "text", content becomes an array of content["text"]
+            for c in message.get("content", []):
+                if "text" in c:
+                    message["content"] = [c]
+                    break
+            # Cast message content to string for TGI compatibility
+            # message["content"] = str(message.get("content", ""))
+
+        logger.info("payload=<%s>", json.dumps(payload, indent=2))
+        # Format the request according to the SageMaker Runtime API requirements
+        request = {
+            "EndpointName": self.endpoint_config["endpoint_name"],
+            "Body": json.dumps(payload),
+            "ContentType": "application/json",
+            "Accept": "application/json",
+        }
+
+        # Add optional SageMaker parameters if provided
+        if self.endpoint_config.get("inference_component_name"):
+            request["InferenceComponentName"] = self.endpoint_config["inference_component_name"]
+        if self.endpoint_config.get("target_model"):
+            request["TargetModel"] = self.endpoint_config["target_model"]
+        if self.endpoint_config.get("target_variant"):
+            request["TargetVariant"] = self.endpoint_config["target_variant"]
+
+        # Add additional args if provided
+        if self.endpoint_config.get("additional_args"):
+            request.update(self.endpoint_config["additional_args"].__dict__)
+
+        print(json.dumps(request["Body"], indent=2))
+
+        return request
+
+    @override
+    async def stream(
+        self,
+        messages: Messages,
+        tool_specs: Optional[list[ToolSpec]] = None,
+        system_prompt: Optional[str] = None,
+        **kwargs: Any,
+    ) -> AsyncGenerator[StreamEvent, None]:
+        """Stream conversation with the SageMaker model.
+
+        Args:
+            messages: List of message objects to be processed by the model.
+            tool_specs: List of tool specifications to make available to the model.
+            system_prompt: System prompt to provide context to the model.
+            **kwargs: Additional keyword arguments for future extensibility.
+
+        Yields:
+            Formatted message chunks from the model.
+        """
+        logger.debug("formatting request")
+        request = self.format_request(messages, tool_specs, system_prompt)
+        logger.debug("formatted request=<%s>", request)
+
+        logger.debug("invoking model")
+        try:
+            if self.payload_config.get("stream", True):
+                response = self.client.invoke_endpoint_with_response_stream(**request)
+
+                # Message start
+                yield self.format_chunk({"chunk_type": "message_start"})
+
+                # Parse the content
+                finish_reason = ""
+                partial_content = ""
+                tool_calls: dict[int, list[Any]] = {}
+                has_text_content = False
+                text_content_started = False
+                reasoning_content_started = False
+
+                for event in response["Body"]:
+                    chunk = event["PayloadPart"]["Bytes"].decode("utf-8")
+                    partial_content += chunk[6:] if chunk.startswith("data: ") else chunk  # TGI fix
+                    logger.info("chunk=<%s>", partial_content)
+                    try:
+                        content = json.loads(partial_content)
+                        partial_content = ""
+                        choice = content["choices"][0]
+                        logger.info("choice=<%s>", json.dumps(choice, indent=2))
+
+                        # Handle text content
+                        if choice["delta"].get("content", None):
+                            if not text_content_started:
+                                yield self.format_chunk({"chunk_type": "content_start", "data_type": "text"})
+                                text_content_started = True
+                            has_text_content = True
+                            yield self.format_chunk(
+                                {
+                                    "chunk_type": "content_delta",
+                                    "data_type": "text",
+                                    "data": choice["delta"]["content"],
+                                }
+                            )
+
+                        # Handle reasoning content
+                        if choice["delta"].get("reasoning_content", None):
+                            if not reasoning_content_started:
+                                yield self.format_chunk(
+                                    {"chunk_type": "content_start", "data_type": "reasoning_content"}
+                                )
+                                reasoning_content_started = True
+                            yield self.format_chunk(
+                                {
+                                    "chunk_type": "content_delta",
+                                    "data_type": "reasoning_content",
+                                    "data": choice["delta"]["reasoning_content"],
+                                }
+                            )
+
+                        # Handle tool calls
+                        generated_tool_calls = choice["delta"].get("tool_calls", [])
+                        if not isinstance(generated_tool_calls, list):
+                            generated_tool_calls = [generated_tool_calls]
+                        for tool_call in generated_tool_calls:
+                            tool_calls.setdefault(tool_call["index"], []).append(tool_call)
+
+                        if choice["finish_reason"] is not None:
+                            finish_reason = choice["finish_reason"]
+                            break
+
+                        if choice.get("usage", None):
+                            yield self.format_chunk(
+                                {"chunk_type": "metadata", "data": UsageMetadata(**choice["usage"])}
+                            )
+
+                    except json.JSONDecodeError:
+                        # Continue accumulating content until we have valid JSON
+                        continue
+
+                # Close reasoning content if it was started
+                if reasoning_content_started:
+                    yield self.format_chunk({"chunk_type": "content_stop", "data_type": "reasoning_content"})
+
+                # Close text content if it was started
+                if text_content_started:
+                    yield self.format_chunk({"chunk_type": "content_stop", "data_type": "text"})
+
+                # Handle tool calling
+                logger.info("tool_calls=<%s>", json.dumps(tool_calls, indent=2))
+                for tool_deltas in tool_calls.values():
+                    if not tool_deltas[0]["function"].get("name", None):
+                        raise Exception("The model did not provide a tool name.")
+                    yield self.format_chunk(
+                        {"chunk_type": "content_start", "data_type": "tool", "data": ToolCall(**tool_deltas[0])}
+                    )
+                    for tool_delta in tool_deltas:
+                        yield self.format_chunk(
+                            {"chunk_type": "content_delta", "data_type": "tool", "data": ToolCall(**tool_delta)}
+                        )
+                    yield self.format_chunk({"chunk_type": "content_stop", "data_type": "tool"})
+
+                # If no content was generated at all, ensure we have empty text content
+                if not has_text_content and not tool_calls:
+                    yield self.format_chunk({"chunk_type": "content_start", "data_type": "text"})
+                    yield self.format_chunk({"chunk_type": "content_stop", "data_type": "text"})
+
+                # Message close
+                yield self.format_chunk({"chunk_type": "message_stop", "data": finish_reason})
+
+            else:
+                # Not all SageMaker AI models support streaming!
+                response = self.client.invoke_endpoint(**request)  # type: ignore[assignment]
+                final_response_json = json.loads(response["Body"].read().decode("utf-8"))  # type: ignore[attr-defined]
+                logger.info("response=<%s>", json.dumps(final_response_json, indent=2))
+
+                # Obtain the key elements from the response
+                message = final_response_json["choices"][0]["message"]
+                message_stop_reason = final_response_json["choices"][0]["finish_reason"]
+
+                # Message start
+                yield self.format_chunk({"chunk_type": "message_start"})
+
+                # Handle text
+                if message.get("content", ""):
+                    yield self.format_chunk({"chunk_type": "content_start", "data_type": "text"})
+                    yield self.format_chunk(
+                        {"chunk_type": "content_delta", "data_type": "text", "data": message["content"]}
+                    )
+                    yield self.format_chunk({"chunk_type": "content_stop", "data_type": "text"})
+
+                # Handle reasoning content
+                if message.get("reasoning_content", None):
+                    yield self.format_chunk({"chunk_type": "content_start", "data_type": "reasoning_content"})
+                    yield self.format_chunk(
+                        {
+                            "chunk_type": "content_delta",
+                            "data_type": "reasoning_content",
+                            "data": message["reasoning_content"],
+                        }
+                    )
+                    yield self.format_chunk({"chunk_type": "content_stop", "data_type": "reasoning_content"})
+
+                # Handle the tool calling, if any
+                if message.get("tool_calls", None) or message_stop_reason == "tool_calls":
+                    if not isinstance(message["tool_calls"], list):
+                        message["tool_calls"] = [message["tool_calls"]]
+                    for tool_call in message["tool_calls"]:
+                        # if arguments of tool_call is not str, cast it
+                        if not isinstance(tool_call["function"]["arguments"], str):
+                            tool_call["function"]["arguments"] = json.dumps(tool_call["function"]["arguments"])
+                        yield self.format_chunk(
+                            {"chunk_type": "content_start", "data_type": "tool", "data": ToolCall(**tool_call)}
+                        )
+                        yield self.format_chunk(
+                            {"chunk_type": "content_delta", "data_type": "tool", "data": ToolCall(**tool_call)}
+                        )
+                        yield self.format_chunk({"chunk_type": "content_stop", "data_type": "tool"})
+                    message_stop_reason = "tool_calls"
+
+                # Message close
+                yield self.format_chunk({"chunk_type": "message_stop", "data": message_stop_reason})
+                # Handle usage metadata
+                if final_response_json.get("usage", None):
+                    yield self.format_chunk(
+                        {"chunk_type": "metadata", "data": UsageMetadata(**final_response_json.get("usage", None))}
+                    )
+        except (
+            self.client.exceptions.InternalFailure,
+            self.client.exceptions.ServiceUnavailable,
+            self.client.exceptions.ValidationError,
+            self.client.exceptions.ModelError,
+            self.client.exceptions.InternalDependencyException,
+            self.client.exceptions.ModelNotReadyException,
+        ) as e:
+            logger.error("SageMaker error: %s", str(e))
+            raise e
+
+        logger.debug("finished streaming response from model")
+
+    @override
+    @classmethod
+    def format_request_tool_message(cls, tool_result: ToolResult) -> dict[str, Any]:
+        """Format a SageMaker compatible tool message.
+
+        Args:
+            tool_result: Tool result collected from a tool execution.
+
+        Returns:
+            SageMaker compatible tool message with content as a string.
+        """
+        # Convert content blocks to a simple string for SageMaker compatibility
+        content_parts = []
+        for content in tool_result["content"]:
+            if "json" in content:
+                content_parts.append(json.dumps(content["json"]))
+            elif "text" in content:
+                content_parts.append(content["text"])
+            else:
+                # Handle other content types by converting to string
+                content_parts.append(str(content))
+
+        content_string = " ".join(content_parts)
+
+        return {
+            "role": "tool",
+            "tool_call_id": tool_result["toolUseId"],
+            "content": content_string,  # String instead of list
+        }
+
+    @override
+    @classmethod
+    def format_request_message_content(cls, content: ContentBlock) -> dict[str, Any]:
+        """Format a content block.
+
+        Args:
+            content: Message content.
+
+        Returns:
+            Formatted content block.
+
+        Raises:
+            TypeError: If the content block type cannot be converted to a SageMaker-compatible format.
+        """
+        # if "text" in content and not isinstance(content["text"], str):
+        #     return {"type": "text", "text": str(content["text"])}
+
+        if "reasoningContent" in content and content["reasoningContent"]:
+            return {
+                "signature": content["reasoningContent"].get("reasoningText", {}).get("signature", ""),
+                "thinking": content["reasoningContent"].get("reasoningText", {}).get("text", ""),
+                "type": "thinking",
+            }
+        elif not content.get("reasoningContent", None):
+            content.pop("reasoningContent", None)
+
+        if "video" in content:
+            return {
+                "type": "video_url",
+                "video_url": {
+                    "detail": "auto",
+                    "url": content["video"]["source"]["bytes"],
+                },
+            }
+
+        return super().format_request_message_content(content)
+
+    @override
+    async def structured_output(
+        self, output_model: Type[T], prompt: Messages, system_prompt: Optional[str] = None, **kwargs: Any
+    ) -> AsyncGenerator[dict[str, Union[T, Any]], None]:
+        """Get structured output from the model.
+
+        Args:
+            output_model: The output model to use for the agent.
+            prompt: The prompt messages to use for the agent.
+            system_prompt: System prompt to provide context to the model.
+            **kwargs: Additional keyword arguments for future extensibility.
+
+        Yields:
+            Model events with the last being the structured output.
+        """
+        # Format the request for structured output
+        request = self.format_request(prompt, system_prompt=system_prompt)
+
+        # Parse the payload to add response format
+        payload = json.loads(request["Body"])
+        payload["response_format"] = {
+            "type": "json_schema",
+            "json_schema": {"name": output_model.__name__, "schema": output_model.model_json_schema(), "strict": True},
+        }
+        request["Body"] = json.dumps(payload)
+
+        try:
+            # Use non-streaming mode for structured output
+            response = self.client.invoke_endpoint(**request)
+            final_response_json = json.loads(response["Body"].read().decode("utf-8"))
+
+            # Extract the structured content
+            message = final_response_json["choices"][0]["message"]
+
+            if message.get("content"):
+                try:
+                    # Parse the JSON content and create the output model instance
+                    content_data = json.loads(message["content"])
+                    parsed_output = output_model(**content_data)
+                    yield {"output": parsed_output}
+                except (json.JSONDecodeError, TypeError, ValueError) as e:
+                    raise ValueError(f"Failed to parse structured output: {e}") from e
+            else:
+                raise ValueError("No content found in SageMaker response")
+
+        except (
+            self.client.exceptions.InternalFailure,
+            self.client.exceptions.ServiceUnavailable,
+            self.client.exceptions.ValidationError,
+            self.client.exceptions.ModelError,
+            self.client.exceptions.InternalDependencyException,
+            self.client.exceptions.ModelNotReadyException,
+        ) as e:
+            logger.error("SageMaker structured output error: %s", str(e))
+            raise ValueError(f"SageMaker structured output error: {str(e)}") from e
diff --git a/tests/strands/models/test_sagemaker.py b/tests/strands/models/test_sagemaker.py
new file mode 100644
index 000000000..ba395b2d6
--- /dev/null
+++ b/tests/strands/models/test_sagemaker.py
@@ -0,0 +1,574 @@
+"""Tests for the Amazon SageMaker model provider."""
+
+import json
+import unittest.mock
+from typing import Any, Dict, List
+
+import boto3
+import pytest
+from botocore.config import Config as BotocoreConfig
+
+from strands.models.sagemaker import (
+    FunctionCall,
+    SageMakerAIModel,
+    ToolCall,
+    UsageMetadata,
+)
+from strands.types.content import Messages
+from strands.types.tools import ToolSpec
+
+
+@pytest.fixture
+def boto_session():
+    """Mock boto3 session."""
+    with unittest.mock.patch.object(boto3, "Session") as mock_session:
+        yield mock_session.return_value
+
+
+@pytest.fixture
+def sagemaker_client(boto_session):
+    """Mock SageMaker runtime client."""
+    return boto_session.client.return_value
+
+
+@pytest.fixture
+def endpoint_config() -> Dict[str, Any]:
+    """Default endpoint configuration for tests."""
+    return {
+        "endpoint_name": "test-endpoint",
+        "inference_component_name": "test-component",
+        "region_name": "us-east-1",
+    }
+
+
+@pytest.fixture
+def payload_config() -> Dict[str, Any]:
+    """Default payload configuration for tests."""
+    return {
+        "max_tokens": 1024,
+        "temperature": 0.7,
+        "stream": True,
+    }
+
+
+@pytest.fixture
+def model(boto_session, endpoint_config, payload_config):
+    """SageMaker model instance with mocked boto session."""
+    return SageMakerAIModel(endpoint_config=endpoint_config, payload_config=payload_config, boto_session=boto_session)
+
+
+@pytest.fixture
+def messages() -> Messages:
+    """Sample messages for testing."""
+    return [{"role": "user", "content": [{"text": "What is the capital of France?"}]}]
+
+
+@pytest.fixture
+def tool_specs() -> List[ToolSpec]:
+    """Sample tool specifications for testing."""
+    return [
+        {
+            "name": "get_weather",
+            "description": "Get the weather for a location",
+            "inputSchema": {
+                "json": {
+                    "type": "object",
+                    "properties": {"location": {"type": "string"}},
+                    "required": ["location"],
+                }
+            },
+        }
+    ]
+
+
+@pytest.fixture
+def system_prompt() -> str:
+    """Sample system prompt for testing."""
+    return "You are a helpful assistant."
+
+
+class TestSageMakerAIModel:
+    """Test suite for SageMakerAIModel."""
+
+    def test_init_default(self, boto_session):
+        """Test initialization with default parameters."""
+        endpoint_config = {"endpoint_name": "test-endpoint", "region_name": "us-east-1"}
+        payload_config = {"max_tokens": 1024}
+        model = SageMakerAIModel(
+            endpoint_config=endpoint_config, payload_config=payload_config, boto_session=boto_session
+        )
+
+        assert model.endpoint_config["endpoint_name"] == "test-endpoint"
+        assert model.payload_config.get("stream", True) is True
+
+        boto_session.client.assert_called_once_with(
+            service_name="sagemaker-runtime",
+            config=unittest.mock.ANY,
+        )
+
+    def test_init_with_all_params(self, boto_session):
+        """Test initialization with all parameters."""
+        endpoint_config = {
+            "endpoint_name": "test-endpoint",
+            "inference_component_name": "test-component",
+            "region_name": "us-west-2",
+        }
+        payload_config = {
+            "stream": False,
+            "max_tokens": 1024,
+            "temperature": 0.7,
+        }
+        client_config = BotocoreConfig(user_agent_extra="test-agent")
+
+        model = SageMakerAIModel(
+            endpoint_config=endpoint_config,
+            payload_config=payload_config,
+            boto_session=boto_session,
+            boto_client_config=client_config,
+        )
+
+        assert model.endpoint_config["endpoint_name"] == "test-endpoint"
+        assert model.endpoint_config["inference_component_name"] == "test-component"
+        assert model.payload_config["stream"] is False
+        assert model.payload_config["max_tokens"] == 1024
+        assert model.payload_config["temperature"] == 0.7
+
+        boto_session.client.assert_called_once_with(
+            service_name="sagemaker-runtime",
+            config=unittest.mock.ANY,
+        )
+
+    def test_init_with_client_config(self, boto_session):
+        """Test initialization with client configuration."""
+        endpoint_config = {"endpoint_name": "test-endpoint", "region_name": "us-east-1"}
+        payload_config = {"max_tokens": 1024}
+        client_config = BotocoreConfig(user_agent_extra="test-agent")
+
+        SageMakerAIModel(
+            endpoint_config=endpoint_config,
+            payload_config=payload_config,
+            boto_session=boto_session,
+            boto_client_config=client_config,
+        )
+
+        # Verify client was created with a config that includes our user agent
+        boto_session.client.assert_called_once_with(
+            service_name="sagemaker-runtime",
+            config=unittest.mock.ANY,
+        )
+
+        # Get the actual config passed to client
+        actual_config = boto_session.client.call_args[1]["config"]
+        assert "strands-agents" in actual_config.user_agent_extra
+        assert "test-agent" in actual_config.user_agent_extra
+
+    def test_update_config(self, model):
+        """Test updating model configuration."""
+        new_config = {"target_model": "new-model", "target_variant": "new-variant"}
+        model.update_config(**new_config)
+
+        assert model.endpoint_config["target_model"] == "new-model"
+        assert model.endpoint_config["target_variant"] == "new-variant"
+        # Original values should be preserved
+        assert model.endpoint_config["endpoint_name"] == "test-endpoint"
+        assert model.endpoint_config["inference_component_name"] == "test-component"
+
+    def test_get_config(self, model, endpoint_config):
+        """Test getting model configuration."""
+        config = model.get_config()
+        assert config == model.endpoint_config
+        assert isinstance(config, dict)
+
+    # def test_format_request_messages_with_system_prompt(self, model):
+    #     """Test formatting request messages with system prompt."""
+    #     messages = [{"role": "user", "content": "Hello"}]
+    #     system_prompt = "You are a helpful assistant."
+
+    #     formatted_messages = model.format_request_messages(messages, system_prompt)
+
+    #     assert len(formatted_messages) == 2
+    #     assert formatted_messages[0]["role"] == "system"
+    #     assert formatted_messages[0]["content"] == system_prompt
+    #     assert formatted_messages[1]["role"] == "user"
+    #     assert formatted_messages[1]["content"] == "Hello"
+
+    # def test_format_request_messages_with_tool_calls(self, model):
+    #     """Test formatting request messages with tool calls."""
+    #     messages = [
+    #         {"role": "user", "content": "Hello"},
+    #         {
+    #             "role": "assistant",
+    #             "content": None,
+    #             "tool_calls": [{"id": "123", "type": "function", "function": {"name": "test", "arguments": "{}"}}],
+    #         },
+    #     ]
+
+    #     formatted_messages = model.format_request_messages(messages, None)
+
+    #     assert len(formatted_messages) == 2
+    #     assert formatted_messages[0]["role"] == "user"
+    #     assert formatted_messages[1]["role"] == "assistant"
+    #     assert "content" not in formatted_messages[1]
+    #     assert "tool_calls" in formatted_messages[1]
+
+    # def test_format_request(self, model, messages, tool_specs, system_prompt):
+    #     """Test formatting a request with all parameters."""
+    #     request = model.format_request(messages, tool_specs, system_prompt)
+
+    #     assert request["EndpointName"] == "test-endpoint"
+    #     assert request["InferenceComponentName"] == "test-component"
+    #     assert request["ContentType"] == "application/json"
+    #     assert request["Accept"] == "application/json"
+
+    #     payload = json.loads(request["Body"])
+    #     assert "messages" in payload
+    #     assert len(payload["messages"]) > 0
+    #     assert "tools" in payload
+    #     assert len(payload["tools"]) == 1
+    #     assert payload["tools"][0]["type"] == "function"
+    #     assert payload["tools"][0]["function"]["name"] == "get_weather"
+    #     assert payload["max_tokens"] == 1024
+    #     assert payload["temperature"] == 0.7
+    #     assert payload["stream"] is True
+
+    # def test_format_request_without_tools(self, model, messages, system_prompt):
+    #     """Test formatting a request without tools."""
+    #     request = model.format_request(messages, None, system_prompt)
+
+    #     payload = json.loads(request["Body"])
+    #     assert "tools" in payload
+    #     assert payload["tools"] == []
+
+    @pytest.mark.asyncio
+    async def test_stream_with_streaming_enabled(self, sagemaker_client, model, messages):
+        """Test streaming response with streaming enabled."""
+        # Mock the response from SageMaker
+        mock_response = {
+            "Body": [
+                {
+                    "PayloadPart": {
+                        "Bytes": json.dumps(
+                            {
+                                "choices": [
+                                    {
+                                        "delta": {"content": "Paris is the capital of France."},
+                                        "finish_reason": None,
+                                    }
+                                ]
+                            }
+                        ).encode("utf-8")
+                    }
+                },
+                {
+                    "PayloadPart": {
+                        "Bytes": json.dumps(
+                            {
+                                "choices": [
+                                    {
+                                        "delta": {"content": " It is known for the Eiffel Tower."},
+                                        "finish_reason": "stop",
+                                    }
+                                ]
+                            }
+                        ).encode("utf-8")
+                    }
+                },
+            ]
+        }
+        sagemaker_client.invoke_endpoint_with_response_stream.return_value = mock_response
+
+        response = [chunk async for chunk in model.stream(messages)]
+
+        assert len(response) >= 5
+        assert response[0] == {"messageStart": {"role": "assistant"}}
+
+        # Find content events
+        content_start = next((e for e in response if "contentBlockStart" in e), None)
+        content_delta = next((e for e in response if "contentBlockDelta" in e), None)
+        content_stop = next((e for e in response if "contentBlockStop" in e), None)
+        message_stop = next((e for e in response if "messageStop" in e), None)
+
+        assert content_start is not None
+        assert content_delta is not None
+        assert content_stop is not None
+        assert message_stop is not None
+        assert message_stop["messageStop"]["stopReason"] == "end_turn"
+
+        sagemaker_client.invoke_endpoint_with_response_stream.assert_called_once()
+
+    @pytest.mark.asyncio
+    async def test_stream_with_tool_calls(self, sagemaker_client, model, messages):
+        """Test streaming response with tool calls."""
+        # Mock the response from SageMaker with tool calls
+        mock_response = {
+            "Body": [
+                {
+                    "PayloadPart": {
+                        "Bytes": json.dumps(
+                            {
+                                "choices": [
+                                    {
+                                        "delta": {
+                                            "content": None,
+                                            "tool_calls": [
+                                                {
+                                                    "index": 0,
+                                                    "id": "tool123",
+                                                    "type": "function",
+                                                    "function": {
+                                                        "name": "get_weather",
+                                                        "arguments": '{"location": "Paris"}',
+                                                    },
+                                                }
+                                            ],
+                                        },
+                                        "finish_reason": "tool_calls",
+                                    }
+                                ]
+                            }
+                        ).encode("utf-8")
+                    }
+                }
+            ]
+        }
+        sagemaker_client.invoke_endpoint_with_response_stream.return_value = mock_response
+
+        response = [chunk async for chunk in model.stream(messages)]
+
+        # Verify the response contains tool call events
+        assert len(response) >= 4
+        assert response[0] == {"messageStart": {"role": "assistant"}}
+
+        message_stop = next((e for e in response if "messageStop" in e), None)
+        assert message_stop is not None
+        assert message_stop["messageStop"]["stopReason"] == "tool_use"
+
+        # Find tool call events
+        tool_start = next(
+            (
+                e
+                for e in response
+                if "contentBlockStart" in e and e.get("contentBlockStart", {}).get("start", {}).get("toolUse")
+            ),
+            None,
+        )
+        tool_delta = next(
+            (
+                e
+                for e in response
+                if "contentBlockDelta" in e and e.get("contentBlockDelta", {}).get("delta", {}).get("toolUse")
+            ),
+            None,
+        )
+        tool_stop = next((e for e in response if "contentBlockStop" in e), None)
+
+        assert tool_start is not None
+        assert tool_delta is not None
+        assert tool_stop is not None
+
+        # Verify tool call data
+        tool_use_data = tool_start["contentBlockStart"]["start"]["toolUse"]
+        assert tool_use_data["toolUseId"] == "tool123"
+        assert tool_use_data["name"] == "get_weather"
+
+    @pytest.mark.asyncio
+    async def test_stream_with_partial_json(self, sagemaker_client, model, messages):
+        """Test streaming response with partial JSON chunks."""
+        # Mock the response from SageMaker with split JSON
+        mock_response = {
+            "Body": [
+                {"PayloadPart": {"Bytes": '{"choices": [{"delta": {"content": "Paris is'.encode("utf-8")}},
+                {"PayloadPart": {"Bytes": ' the capital of France."}, "finish_reason": "stop"}]}'.encode("utf-8")}},
+            ]
+        }
+        sagemaker_client.invoke_endpoint_with_response_stream.return_value = mock_response
+
+        response = [chunk async for chunk in model.stream(messages)]
+
+        assert len(response) == 5
+        assert response[0] == {"messageStart": {"role": "assistant"}}
+
+        # Find content events
+        content_start = next((e for e in response if "contentBlockStart" in e), None)
+        content_delta = next((e for e in response if "contentBlockDelta" in e), None)
+        content_stop = next((e for e in response if "contentBlockStop" in e), None)
+        message_stop = next((e for e in response if "messageStop" in e), None)
+
+        assert content_start is not None
+        assert content_delta is not None
+        assert content_stop is not None
+        assert message_stop is not None
+        assert message_stop["messageStop"]["stopReason"] == "end_turn"
+
+        # Verify content
+        text_delta = content_delta["contentBlockDelta"]["delta"]["text"]
+        assert text_delta == "Paris is the capital of France."
+
+    @pytest.mark.asyncio
+    async def test_stream_non_streaming(self, sagemaker_client, model, messages):
+        """Test non-streaming response."""
+        # Configure model for non-streaming
+        model.payload_config["stream"] = False
+
+        # Mock the response from SageMaker
+        mock_response = {"Body": unittest.mock.MagicMock()}
+        mock_response["Body"].read.return_value = json.dumps(
+            {
+                "choices": [
+                    {
+                        "message": {"content": "Paris is the capital of France.", "tool_calls": None},
+                        "finish_reason": "stop",
+                    }
+                ],
+                "usage": {"prompt_tokens": 10, "completion_tokens": 20, "total_tokens": 30, "prompt_tokens_details": 0},
+            }
+        ).encode("utf-8")
+
+        sagemaker_client.invoke_endpoint.return_value = mock_response
+
+        response = [chunk async for chunk in model.stream(messages)]
+
+        assert len(response) >= 6
+        assert response[0] == {"messageStart": {"role": "assistant"}}
+
+        # Find content events
+        content_start = next((e for e in response if "contentBlockStart" in e), None)
+        content_delta = next((e for e in response if "contentBlockDelta" in e), None)
+        content_stop = next((e for e in response if "contentBlockStop" in e), None)
+        message_stop = next((e for e in response if "messageStop" in e), None)
+
+        assert content_start is not None
+        assert content_delta is not None
+        assert content_stop is not None
+        assert message_stop is not None
+
+        # Verify content
+        text_delta = content_delta["contentBlockDelta"]["delta"]["text"]
+        assert text_delta == "Paris is the capital of France."
+
+        sagemaker_client.invoke_endpoint.assert_called_once()
+
+    @pytest.mark.asyncio
+    async def test_stream_non_streaming_with_tool_calls(self, sagemaker_client, model, messages):
+        """Test non-streaming response with tool calls."""
+        # Configure model for non-streaming
+        model.payload_config["stream"] = False
+
+        # Mock the response from SageMaker with tool calls
+        mock_response = {"Body": unittest.mock.MagicMock()}
+        mock_response["Body"].read.return_value = json.dumps(
+            {
+                "choices": [
+                    {
+                        "message": {
+                            "content": None,
+                            "tool_calls": [
+                                {
+                                    "id": "tool123",
+                                    "type": "function",
+                                    "function": {"name": "get_weather", "arguments": '{"location": "Paris"}'},
+                                }
+                            ],
+                        },
+                        "finish_reason": "tool_calls",
+                    }
+                ],
+                "usage": {"prompt_tokens": 10, "completion_tokens": 20, "total_tokens": 30, "prompt_tokens_details": 0},
+            }
+        ).encode("utf-8")
+
+        sagemaker_client.invoke_endpoint.return_value = mock_response
+
+        response = [chunk async for chunk in model.stream(messages)]
+
+        # Verify basic structure
+        assert len(response) >= 6
+        assert response[0] == {"messageStart": {"role": "assistant"}}
+
+        # Find tool call events
+        tool_start = next(
+            (
+                e
+                for e in response
+                if "contentBlockStart" in e and e.get("contentBlockStart", {}).get("start", {}).get("toolUse")
+            ),
+            None,
+        )
+        tool_delta = next(
+            (
+                e
+                for e in response
+                if "contentBlockDelta" in e and e.get("contentBlockDelta", {}).get("delta", {}).get("toolUse")
+            ),
+            None,
+        )
+        tool_stop = next((e for e in response if "contentBlockStop" in e), None)
+        message_stop = next((e for e in response if "messageStop" in e), None)
+
+        assert tool_start is not None
+        assert tool_delta is not None
+        assert tool_stop is not None
+        assert message_stop is not None
+
+        # Verify tool call data
+        tool_use_data = tool_start["contentBlockStart"]["start"]["toolUse"]
+        assert tool_use_data["toolUseId"] == "tool123"
+        assert tool_use_data["name"] == "get_weather"
+
+        # Verify metadata
+        metadata = next((e for e in response if "metadata" in e), None)
+        assert metadata is not None
+        usage_data = metadata["metadata"]["usage"]
+        assert usage_data["totalTokens"] == 30
+
+
+class TestDataClasses:
+    """Test suite for data classes."""
+
+    def test_usage_metadata(self):
+        """Test UsageMetadata dataclass."""
+        usage = UsageMetadata(total_tokens=100, completion_tokens=30, prompt_tokens=70, prompt_tokens_details=5)
+
+        assert usage.total_tokens == 100
+        assert usage.completion_tokens == 30
+        assert usage.prompt_tokens == 70
+        assert usage.prompt_tokens_details == 5
+
+    def test_function_call(self):
+        """Test FunctionCall dataclass."""
+        func = FunctionCall(name="get_weather", arguments='{"location": "Paris"}')
+
+        assert func.name == "get_weather"
+        assert func.arguments == '{"location": "Paris"}'
+
+        # Test initialization with kwargs
+        func2 = FunctionCall(**{"name": "get_time", "arguments": '{"timezone": "UTC"}'})
+
+        assert func2.name == "get_time"
+        assert func2.arguments == '{"timezone": "UTC"}'
+
+    def test_tool_call(self):
+        """Test ToolCall dataclass."""
+        # Create a tool call using kwargs directly
+        tool = ToolCall(
+            id="tool123", type="function", function={"name": "get_weather", "arguments": '{"location": "Paris"}'}
+        )
+
+        assert tool.id == "tool123"
+        assert tool.type == "function"
+        assert tool.function.name == "get_weather"
+        assert tool.function.arguments == '{"location": "Paris"}'
+
+        # Test initialization with kwargs
+        tool2 = ToolCall(
+            **{
+                "id": "tool456",
+                "type": "function",
+                "function": {"name": "get_time", "arguments": '{"timezone": "UTC"}'},
+            }
+        )
+
+        assert tool2.id == "tool456"
+        assert tool2.type == "function"
+        assert tool2.function.name == "get_time"
+        assert tool2.function.arguments == '{"timezone": "UTC"}'
diff --git a/tests_integ/models/test_model_sagemaker.py b/tests_integ/models/test_model_sagemaker.py
new file mode 100644
index 000000000..62362e299
--- /dev/null
+++ b/tests_integ/models/test_model_sagemaker.py
@@ -0,0 +1,76 @@
+import os
+
+import pytest
+
+import strands
+from strands import Agent
+from strands.models.sagemaker import SageMakerAIModel
+
+
+@pytest.fixture
+def model():
+    endpoint_config = SageMakerAIModel.SageMakerAIEndpointConfig(
+        endpoint_name=os.getenv("SAGEMAKER_ENDPOINT_NAME", ""), region_name="us-east-1"
+    )
+    payload_config = SageMakerAIModel.SageMakerAIPayloadSchema(max_tokens=1024, temperature=0.7, stream=False)
+    return SageMakerAIModel(endpoint_config=endpoint_config, payload_config=payload_config)
+
+
+@pytest.fixture
+def tools():
+    @strands.tool
+    def tool_time(location: str) -> str:
+        """Get the current time for a location."""
+        return f"The time in {location} is 12:00 PM"
+
+    @strands.tool
+    def tool_weather(location: str) -> str:
+        """Get the current weather for a location."""
+        return f"The weather in {location} is sunny"
+
+    return [tool_time, tool_weather]
+
+
+@pytest.fixture
+def system_prompt():
+    return "You are a helpful assistant that provides concise answers."
+
+
+@pytest.fixture
+def agent(model, tools, system_prompt):
+    return Agent(model=model, tools=tools, system_prompt=system_prompt)
+
+
+@pytest.mark.skipif(
+    "SAGEMAKER_ENDPOINT_NAME" not in os.environ,
+    reason="SAGEMAKER_ENDPOINT_NAME environment variable missing",
+)
+def test_agent_with_tools(agent):
+    result = agent("What is the time and weather in New York?")
+    text = result.message["content"][0]["text"].lower()
+
+    assert "12:00" in text and "sunny" in text
+
+
+@pytest.mark.skipif(
+    "SAGEMAKER_ENDPOINT_NAME" not in os.environ,
+    reason="SAGEMAKER_ENDPOINT_NAME environment variable missing",
+)
+def test_agent_without_tools(model, system_prompt):
+    agent = Agent(model=model, system_prompt=system_prompt)
+    result = agent("Hello, how are you?")
+
+    assert result.message["content"][0]["text"]
+    assert len(result.message["content"][0]["text"]) > 0
+
+
+@pytest.mark.skipif(
+    "SAGEMAKER_ENDPOINT_NAME" not in os.environ,
+    reason="SAGEMAKER_ENDPOINT_NAME environment variable missing",
+)
+@pytest.mark.parametrize("location", ["Tokyo", "London", "Sydney"])
+def test_agent_different_locations(agent, location):
+    result = agent(f"What is the weather in {location}?")
+    text = result.message["content"][0]["text"].lower()
+
+    assert location.lower() in text and "sunny" in text