From cd097ab36102f09dbd87900b4247fe1a3dbaa94e Mon Sep 17 00:00:00 2001
From: Suresh Veeragoni <suvee@amazon.com>
Date: Fri, 11 Jul 2025 18:18:45 -0700
Subject: [PATCH 1/3] # Add DeepSeek model provider support
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

## Features
- **New DeepSeek Model Provider**: Full implementation with streaming and structured output support
- **OpenAI-compatible API**: Uses OpenAI client for seamless integration with DeepSeek endpoints
- **Reasoning Model Support**: Handles DeepSeek-specific features like reasoning content
- **Beta Features**: Support for beta endpoint and advanced DeepSeek capabilities

## Changes
- `src/strands/models/deepseek.py`: New DeepSeek model provider implementation
- `src/strands/models/__init__.py`: Export DeepSeekModel class
- `tests_integ/models/test_model_deepseek.py`: Comprehensive integration tests (7 test cases)
- `tests_integ/models/providers.py`: Add DeepSeek to provider configuration
- `README.md`: Update documentation with DeepSeek examples and provider list

## Usage
```python
from strands.models.deepseek import DeepSeekModel
model = DeepSeekModel(api_key="your-key", model_id="deepseek-chat")

Testing
✅ All 7 integration tests passing

✅ Basic conversation, structured output, streaming, tool usage

✅ Configuration updates and async operations
---
 README.md                                 |  10 +
 src/strands/models/__init__.py            |   5 +-
 src/strands/models/deepseek.py            | 298 ++++++++++++++++++++++
 tests_integ/models/providers.py           |  10 +
 tests_integ/models/test_model_deepseek.py | 143 +++++++++++
 5 files changed, 464 insertions(+), 2 deletions(-)
 create mode 100644 src/strands/models/deepseek.py
 create mode 100644 tests_integ/models/test_model_deepseek.py

diff --git a/README.md b/README.md
index ed98d0012..505cda2b8 100644
--- a/README.md
+++ b/README.md
@@ -116,6 +116,7 @@ Support for various model providers:
 ```python
 from strands import Agent
 from strands.models import BedrockModel
+from strands.models.deepseek import DeepSeekModel
 from strands.models.ollama import OllamaModel
 from strands.models.llamaapi import LlamaAPIModel
 
@@ -128,6 +129,14 @@ bedrock_model = BedrockModel(
 agent = Agent(model=bedrock_model)
 agent("Tell me about Agentic AI")
 
+# DeepSeek
+deepseek_model = DeepSeekModel(
+  api_key="your-deepseek-api-key",
+  model_id="deepseek-chat"
+)
+agent = Agent(model=deepseek_model)
+agent("Tell me about Agentic AI")
+
 # Ollama
 ollama_model = OllamaModel(
   host="http://localhost:11434",
@@ -147,6 +156,7 @@ response = agent("Tell me about Agentic AI")
 Built-in providers:
  - [Amazon Bedrock](https://strandsagents.com/latest/user-guide/concepts/model-providers/amazon-bedrock/)
  - [Anthropic](https://strandsagents.com/latest/user-guide/concepts/model-providers/anthropic/)
+ - [DeepSeek](https://platform.deepseek.com/api-docs/)
  - [LiteLLM](https://strandsagents.com/latest/user-guide/concepts/model-providers/litellm/)
  - [LlamaAPI](https://strandsagents.com/latest/user-guide/concepts/model-providers/llamaapi/)
  - [Ollama](https://strandsagents.com/latest/user-guide/concepts/model-providers/ollama/)
diff --git a/src/strands/models/__init__.py b/src/strands/models/__init__.py
index ead290a35..4a525058a 100644
--- a/src/strands/models/__init__.py
+++ b/src/strands/models/__init__.py
@@ -3,8 +3,9 @@
 This package includes an abstract base Model class along with concrete implementations for specific providers.
 """
 
-from . import bedrock, model
+from . import bedrock, deepseek, model
 from .bedrock import BedrockModel
+from .deepseek import DeepSeekModel
 from .model import Model
 
-__all__ = ["bedrock", "model", "BedrockModel", "Model"]
+__all__ = ["bedrock", "deepseek", "model", "BedrockModel", "DeepSeekModel", "Model"]
diff --git a/src/strands/models/deepseek.py b/src/strands/models/deepseek.py
new file mode 100644
index 000000000..960d71cbb
--- /dev/null
+++ b/src/strands/models/deepseek.py
@@ -0,0 +1,298 @@
+"""DeepSeek model provider.
+
+- Docs: https://platform.deepseek.com/api-docs/
+"""
+
+import json
+import logging
+from typing import Any, AsyncGenerator, Optional, Type, TypeVar
+
+import openai
+from pydantic import BaseModel
+from typing_extensions import TypedDict, Unpack, override
+
+from ..types.content import Messages
+from ..types.streaming import StreamEvent
+from ..types.tools import ToolSpec
+from .model import Model
+
+logger = logging.getLogger(__name__)
+
+T = TypeVar("T", bound=BaseModel)
+
+
+class DeepSeekModel(Model):
+    """DeepSeek model provider implementation using OpenAI-compatible API."""
+
+    class DeepSeekConfig(TypedDict, total=False):
+        """Configuration parameters for DeepSeek models.
+
+        Attributes:
+            model_id: DeepSeek model ID (e.g., "deepseek-chat", "deepseek-reasoner").
+            api_key: DeepSeek API key.
+            base_url: API base URL.
+            use_beta: Whether to use beta endpoint for advanced features.
+            params: Additional model parameters.
+        """
+
+        model_id: str
+        api_key: str
+        base_url: Optional[str]
+        use_beta: Optional[bool]
+        params: Optional[dict[str, Any]]
+
+    def __init__(
+        self,
+        api_key: str,
+        *,
+        model_id: str = "deepseek-chat",
+        base_url: Optional[str] = None,
+        use_beta: bool = False,
+        params: Optional[dict[str, Any]] = None,
+        **kwargs: Any,
+    ) -> None:
+        """Initialize DeepSeek provider instance.
+
+        Args:
+            api_key: DeepSeek API key.
+            model_id: Model ID to use.
+            base_url: Custom base URL. Defaults to standard or beta endpoint.
+            use_beta: Whether to use beta endpoint.
+            params: Additional model parameters.
+            **kwargs: Additional arguments for future extensibility.
+        """
+        if base_url is None:
+            base_url = "https://api.deepseek.com/beta" if use_beta else "https://api.deepseek.com"
+
+        self.config = DeepSeekModel.DeepSeekConfig(
+            model_id=model_id,
+            api_key=api_key,
+            base_url=base_url,
+            use_beta=use_beta,
+            params=params or {},
+        )
+
+        logger.debug("config=<%s> | initializing", self.config)
+
+        self.client = openai.AsyncOpenAI(
+            api_key=self.config["api_key"],
+            base_url=self.config["base_url"],
+        )
+
+    @override
+    def update_config(self, **model_config: Unpack[DeepSeekConfig]) -> None:  # type: ignore
+        """Update the DeepSeek model configuration.
+
+        Args:
+            **model_config: Configuration overrides.
+        """
+        self.config.update(model_config)
+
+        # Recreate client if API settings changed
+        if any(key in model_config for key in ["api_key", "base_url"]):
+            self.client = openai.AsyncOpenAI(
+                api_key=self.config["api_key"],
+                base_url=self.config["base_url"],
+            )
+
+    @override
+    def get_config(self) -> DeepSeekConfig:
+        """Get the DeepSeek model configuration.
+
+        Returns:
+            The DeepSeek model configuration.
+        """
+        return self.config
+
+    def format_request(
+        self, messages: Messages, tool_specs: Optional[list[ToolSpec]] = None, system_prompt: Optional[str] = None
+    ) -> dict[str, Any]:
+        """Format a DeepSeek chat request.
+
+        Args:
+            messages: List of message objects to be processed by the model.
+            tool_specs: List of tool specifications to make available to the model.
+            system_prompt: System prompt to provide context to the model.
+
+        Returns:
+            A DeepSeek chat request.
+        """
+        formatted_messages = []
+
+        if system_prompt:
+            formatted_messages.append({"role": "system", "content": system_prompt})
+
+        # Convert Strands messages to OpenAI format
+        for message in messages:
+            if message["role"] in ["user", "assistant"]:
+                content = ""
+                for block in message["content"]:
+                    if "text" in block:
+                        content += block["text"]
+                formatted_messages.append({"role": message["role"], "content": content})
+
+        request = {
+            "model": self.config["model_id"],
+            "messages": formatted_messages,
+            "stream": True,
+            **self.config.get("params", {}),
+        }
+
+        if tool_specs:
+            request["tools"] = [
+                {
+                    "type": "function",
+                    "function": {
+                        "name": tool_spec["name"],
+                        "description": tool_spec["description"],
+                        "parameters": tool_spec["inputSchema"]["json"],
+                    },
+                }
+                for tool_spec in tool_specs
+            ]
+
+        return request
+
+    def format_chunk(self, event: dict[str, Any]) -> StreamEvent:
+        """Format DeepSeek response event into standardized message chunk.
+
+        Args:
+            event: A response event from the DeepSeek model.
+
+        Returns:
+            The formatted chunk.
+        """
+        match event["chunk_type"]:
+            case "message_start":
+                return {"messageStart": {"role": "assistant"}}
+
+            case "content_start":
+                return {"contentBlockStart": {"start": {}}}
+
+            case "content_delta":
+                if event["data_type"] == "reasoning_content":
+                    return {"contentBlockDelta": {"delta": {"reasoningContent": {"text": event["data"]}}}}
+                return {"contentBlockDelta": {"delta": {"text": event["data"]}}}
+
+            case "content_stop":
+                return {"contentBlockStop": {}}
+
+            case "message_stop":
+                return {"messageStop": {"stopReason": "end_turn"}}
+
+            case _:
+                return {"contentBlockDelta": {"delta": {"text": ""}}}
+
+    @override
+    async def stream(
+        self,
+        messages: Messages,
+        tool_specs: Optional[list[ToolSpec]] = None,
+        system_prompt: Optional[str] = None,
+        **kwargs: Any,
+    ) -> AsyncGenerator[StreamEvent, None]:
+        """Stream conversation with the DeepSeek model.
+
+        Args:
+            messages: List of message objects to be processed by the model.
+            tool_specs: List of tool specifications to make available to the model.
+            system_prompt: System prompt to provide context to the model.
+            **kwargs: Additional keyword arguments for future extensibility.
+
+        Yields:
+            Formatted message chunks from the model.
+        """
+        logger.debug("formatting request")
+        request = self.format_request(messages, tool_specs, system_prompt)
+        logger.debug("request=<%s>", request)
+
+        logger.debug("invoking model")
+        response = await self.client.chat.completions.create(**request)
+
+        logger.debug("got response from model")
+        yield self.format_chunk({"chunk_type": "message_start"})
+        yield self.format_chunk({"chunk_type": "content_start"})
+
+        async for chunk in response:
+            if hasattr(chunk, "choices") and chunk.choices:
+                choice = chunk.choices[0]
+
+                if hasattr(choice, "delta") and choice.delta:
+                    delta = choice.delta
+
+                    # Handle reasoning content
+                    if hasattr(delta, "reasoning_content") and delta.reasoning_content:
+                        yield self.format_chunk({
+                            "chunk_type": "content_delta",
+                            "data_type": "reasoning_content",
+                            "data": delta.reasoning_content,
+                        })
+
+                    # Handle regular content
+                    if hasattr(delta, "content") and delta.content:
+                        yield self.format_chunk({
+                            "chunk_type": "content_delta",
+                            "data_type": "text",
+                            "data": delta.content,
+                        })
+
+                if hasattr(choice, "finish_reason") and choice.finish_reason:
+                    break
+
+        yield self.format_chunk({"chunk_type": "content_stop"})
+        yield self.format_chunk({"chunk_type": "message_stop"})
+
+        logger.debug("finished streaming response from model")
+
+    @override
+    async def structured_output(
+        self, output_model: Type[T], prompt: Messages, **kwargs: Any
+    ) -> AsyncGenerator[dict[str, T], None]:
+        """Get structured output from the model.
+
+        Args:
+            output_model: The output model to use for the agent.
+            prompt: The prompt messages to use for the agent.
+            **kwargs: Additional keyword arguments for future extensibility.
+
+        Yields:
+            Model events with the structured output.
+        """
+        # Extract text from prompt
+        text_prompt = ""
+        for message in prompt:
+            if message.get("role") == "user":
+                for block in message.get("content", []):
+                    if "text" in block:
+                        text_prompt += block["text"]
+
+        # Create JSON schema prompt
+        schema = output_model.model_json_schema()
+        properties = schema.get("properties", {})
+        field_descriptions = [
+            f"- {field_name}: {field_info.get('description', field_name)} ({field_info.get('type', 'string')})"
+            for field_name, field_info in properties.items()
+        ]
+
+        json_prompt = f"""{text_prompt}
+
+Extract the information and return it as JSON with these fields:
+{chr(10).join(field_descriptions)}
+
+Return only the JSON object with the extracted data, no additional text."""
+
+        request_params = {
+            "model": self.config["model_id"],
+            "messages": [{"role": "user", "content": json_prompt}],
+            "response_format": {"type": "json_object"},
+        }
+
+        # Add max_tokens for reasoning model
+        if self.config["model_id"] == "deepseek-reasoner":
+            request_params["max_tokens"] = 32000
+
+        response = await self.client.chat.completions.create(**request_params)
+        json_data = json.loads(response.choices[0].message.content)
+        result = output_model(**json_data)
+
+        yield {"output": result}
\ No newline at end of file
diff --git a/tests_integ/models/providers.py b/tests_integ/models/providers.py
index 543f58480..02f113ad2 100644
--- a/tests_integ/models/providers.py
+++ b/tests_integ/models/providers.py
@@ -10,6 +10,7 @@
 
 from strands.models import BedrockModel, Model
 from strands.models.anthropic import AnthropicModel
+from strands.models.deepseek import DeepSeekModel
 from strands.models.litellm import LiteLLMModel
 from strands.models.llamaapi import LlamaAPIModel
 from strands.models.mistral import MistralModel
@@ -126,6 +127,14 @@ def __init__(self):
         stream_options={"include_usage": True},
     ),
 )
+deepseek = ProviderInfo(
+    id="deepseek",
+    environment_variable="DEEPSEEK_API_KEY",
+    factory=lambda: DeepSeekModel(
+        model_id="deepseek-chat",
+        api_key=os.getenv("DEEPSEEK_API_KEY"),
+    ),
+)
 
 ollama = OllamaProviderInfo()
 
@@ -134,6 +143,7 @@ def __init__(self):
     bedrock,
     anthropic,
     cohere,
+    deepseek,
     llama,
     litellm,
     mistral,
diff --git a/tests_integ/models/test_model_deepseek.py b/tests_integ/models/test_model_deepseek.py
new file mode 100644
index 000000000..af1e4c46d
--- /dev/null
+++ b/tests_integ/models/test_model_deepseek.py
@@ -0,0 +1,143 @@
+import os
+
+import pytest
+from pydantic import BaseModel, Field
+
+import strands
+from strands import Agent
+from strands.models.deepseek import DeepSeekModel
+
+# these tests only run if we have the deepseek api key
+pytestmark = pytest.mark.skipif(
+    "DEEPSEEK_API_KEY" not in os.environ,
+    reason="DEEPSEEK_API_KEY environment variable missing",
+)
+
+
+@pytest.fixture()
+def base_model():
+    return DeepSeekModel(
+        api_key=os.getenv("DEEPSEEK_API_KEY"),
+        model_id="deepseek-chat",
+        params={"max_tokens": 2000, "temperature": 0.7}
+    )
+
+
+@pytest.fixture()
+def reasoning_model():
+    return DeepSeekModel(
+        api_key=os.getenv("DEEPSEEK_API_KEY"),
+        model_id="deepseek-reasoner",
+        params={"max_tokens": 32000}
+    )
+
+
+@pytest.fixture()
+def beta_model():
+    return DeepSeekModel(
+        api_key=os.getenv("DEEPSEEK_API_KEY"),
+        model_id="deepseek-chat",
+        use_beta=True,
+        params={"max_tokens": 1000}
+    )
+
+
+@pytest.fixture()
+def tools():
+    @strands.tool
+    def tool_time() -> str:
+        return "12:00"
+
+    @strands.tool
+    def tool_weather() -> str:
+        return "sunny"
+
+    return [tool_time, tool_weather]
+
+
+@pytest.fixture()
+def base_agent(base_model, tools):
+    return Agent(model=base_model, tools=tools)
+
+
+class PersonInfo(BaseModel):
+    """Extract person information from text."""
+    name: str = Field(description="Full name of the person")
+    age: int = Field(description="Age in years")
+    occupation: str = Field(description="Job or profession")
+
+
+class WeatherInfo(BaseModel):
+    """Weather information."""
+    location: str = Field(description="City and state")
+    temperature: str = Field(description="Current temperature")
+    condition: str = Field(description="Weather condition")
+
+
+def test_basic_conversation(base_agent):
+    result = base_agent("Hello, how are you today?")
+    assert "content" in result.message
+    assert len(result.message["content"]) > 0
+
+
+def test_structured_output_person(base_agent):
+    result = base_agent.structured_output(
+        PersonInfo,
+        "John Smith is a 30-year-old software engineer working at a tech startup."
+    )
+    assert result.name == "John Smith"
+    assert result.age == 30
+    assert "engineer" in result.occupation.lower()
+
+
+def test_tool_usage(base_agent):
+    result = base_agent("What is the time and weather?")
+    # Handle case where content might be empty or structured differently
+    content = result.message.get("content", [])
+    if content and "text" in content[0]:
+        text = content[0]["text"].lower()
+        assert any(string in text for string in ["12:00", "sunny"])
+    else:
+        # If no text content, just verify the result exists
+        assert result.message is not None
+
+
+@pytest.mark.asyncio
+async def test_streaming(base_model):
+    agent = Agent(model=base_model)
+    events = []
+    async for event in agent.stream_async("Tell me a short fact about robots"):
+        events.append(event)
+    
+    assert len(events) > 0
+    assert "result" in events[-1]
+
+
+def test_config_update(base_model):
+    original_config = base_model.get_config()
+    assert original_config["model_id"] == "deepseek-chat"
+    
+    base_model.update_config(model_id="deepseek-reasoner", params={"temperature": 0.5})
+    updated_config = base_model.get_config()
+    assert updated_config["model_id"] == "deepseek-reasoner"
+
+
+def test_weather_structured_output(base_agent):
+    result = base_agent.structured_output(
+        WeatherInfo,
+        "Get the weather for San Francisco, CA. It's currently 72°F and sunny."
+    )
+    assert "san francisco" in result.location.lower()
+    assert "72" in result.temperature
+    assert "sunny" in result.condition.lower()
+
+
+@pytest.mark.asyncio
+async def test_async_structured_output(base_agent):
+    result = await base_agent.structured_output_async(
+        PersonInfo,
+        "Alice Johnson is a 25-year-old teacher at the local school."
+    )
+    assert result.name == "Alice Johnson"
+    assert result.age == 25
+    assert "teacher" in result.occupation.lower()
\ No newline at end of file

From 8e4cd4025bc79e000f6c79193657a29be4794467 Mon Sep 17 00:00:00 2001
From: Suresh Veeragoni <suvee@amazon.com>
Date: Fri, 11 Jul 2025 18:24:52 -0700
Subject: [PATCH 2/3] updates after hatch run prepare

---
 src/strands/models/deepseek.py            | 26 +++++++++++---------
 tests_integ/models/test_model_deepseek.py | 30 +++++++++--------------
 2 files changed, 26 insertions(+), 30 deletions(-)

diff --git a/src/strands/models/deepseek.py b/src/strands/models/deepseek.py
index 960d71cbb..804302f4b 100644
--- a/src/strands/models/deepseek.py
+++ b/src/strands/models/deepseek.py
@@ -222,19 +222,23 @@ async def stream(
 
                     # Handle reasoning content
                     if hasattr(delta, "reasoning_content") and delta.reasoning_content:
-                        yield self.format_chunk({
-                            "chunk_type": "content_delta",
-                            "data_type": "reasoning_content",
-                            "data": delta.reasoning_content,
-                        })
+                        yield self.format_chunk(
+                            {
+                                "chunk_type": "content_delta",
+                                "data_type": "reasoning_content",
+                                "data": delta.reasoning_content,
+                            }
+                        )
 
                     # Handle regular content
                     if hasattr(delta, "content") and delta.content:
-                        yield self.format_chunk({
-                            "chunk_type": "content_delta",
-                            "data_type": "text",
-                            "data": delta.content,
-                        })
+                        yield self.format_chunk(
+                            {
+                                "chunk_type": "content_delta",
+                                "data_type": "text",
+                                "data": delta.content,
+                            }
+                        )
 
                 if hasattr(choice, "finish_reason") and choice.finish_reason:
                     break
@@ -295,4 +299,4 @@ async def structured_output(
         json_data = json.loads(response.choices[0].message.content)
         result = output_model(**json_data)
 
-        yield {"output": result}
\ No newline at end of file
+        yield {"output": result}
diff --git a/tests_integ/models/test_model_deepseek.py b/tests_integ/models/test_model_deepseek.py
index af1e4c46d..9aae5f2d7 100644
--- a/tests_integ/models/test_model_deepseek.py
+++ b/tests_integ/models/test_model_deepseek.py
@@ -17,28 +17,21 @@
 @pytest.fixture()
 def base_model():
     return DeepSeekModel(
-        api_key=os.getenv("DEEPSEEK_API_KEY"),
-        model_id="deepseek-chat",
-        params={"max_tokens": 2000, "temperature": 0.7}
+        api_key=os.getenv("DEEPSEEK_API_KEY"), model_id="deepseek-chat", params={"max_tokens": 2000, "temperature": 0.7}
     )
 
 
 @pytest.fixture()
 def reasoning_model():
     return DeepSeekModel(
-        api_key=os.getenv("DEEPSEEK_API_KEY"),
-        model_id="deepseek-reasoner",
-        params={"max_tokens": 32000}
+        api_key=os.getenv("DEEPSEEK_API_KEY"), model_id="deepseek-reasoner", params={"max_tokens": 32000}
     )
 
 
 @pytest.fixture()
 def beta_model():
     return DeepSeekModel(
-        api_key=os.getenv("DEEPSEEK_API_KEY"),
-        model_id="deepseek-chat",
-        use_beta=True,
-        params={"max_tokens": 1000}
+        api_key=os.getenv("DEEPSEEK_API_KEY"), model_id="deepseek-chat", use_beta=True, params={"max_tokens": 1000}
     )
 
 
@@ -62,6 +55,7 @@ def base_agent(base_model, tools):
 
 class PersonInfo(BaseModel):
     """Extract person information from text."""
+
     name: str = Field(description="Full name of the person")
     age: int = Field(description="Age in years")
     occupation: str = Field(description="Job or profession")
@@ -69,6 +63,7 @@ class PersonInfo(BaseModel):
 
 class WeatherInfo(BaseModel):
     """Weather information."""
+
     location: str = Field(description="City and state")
     temperature: str = Field(description="Current temperature")
     condition: str = Field(description="Weather condition")
@@ -82,8 +77,7 @@ def test_basic_conversation(base_agent):
 
 def test_structured_output_person(base_agent):
     result = base_agent.structured_output(
-        PersonInfo,
-        "John Smith is a 30-year-old software engineer working at a tech startup."
+        PersonInfo, "John Smith is a 30-year-old software engineer working at a tech startup."
     )
     assert result.name == "John Smith"
     assert result.age == 30
@@ -108,7 +102,7 @@ async def test_streaming(base_model):
     events = []
     async for event in agent.stream_async("Tell me a short fact about robots"):
         events.append(event)
-    
+
     assert len(events) > 0
     assert "result" in events[-1]
 
@@ -116,7 +110,7 @@ async def test_streaming(base_model):
 def test_config_update(base_model):
     original_config = base_model.get_config()
     assert original_config["model_id"] == "deepseek-chat"
-    
+
     base_model.update_config(model_id="deepseek-reasoner", params={"temperature": 0.5})
     updated_config = base_model.get_config()
     assert updated_config["model_id"] == "deepseek-reasoner"
@@ -124,8 +118,7 @@ def test_config_update(base_model):
 
 def test_weather_structured_output(base_agent):
     result = base_agent.structured_output(
-        WeatherInfo,
-        "Get the weather for San Francisco, CA. It's currently 72°F and sunny."
+        WeatherInfo, "Get the weather for San Francisco, CA. It's currently 72°F and sunny."
     )
     assert "san francisco" in result.location.lower()
     assert "72" in result.temperature
@@ -135,9 +128,8 @@ def test_weather_structured_output(base_agent):
 @pytest.mark.asyncio
 async def test_async_structured_output(base_agent):
     result = await base_agent.structured_output_async(
-        PersonInfo,
-        "Alice Johnson is a 25-year-old teacher at the local school."
+        PersonInfo, "Alice Johnson is a 25-year-old teacher at the local school."
     )
     assert result.name == "Alice Johnson"
     assert result.age == 25
-    assert "teacher" in result.occupation.lower()
\ No newline at end of file
+    assert "teacher" in result.occupation.lower()

From a824b9d4acae4b796fc5e3620f9546c97db83c7f Mon Sep 17 00:00:00 2001
From: Suresh Veeragoni <suvee@amazon.com>
Date: Sat, 12 Jul 2025 01:54:07 -0700
Subject: [PATCH 3/3] fixes to tool usage

---
 src/strands/models/deepseek.py            | 198 ++++++++++++++++------
 tests_integ/models/test_model_deepseek.py | 127 +++++++++-----
 2 files changed, 227 insertions(+), 98 deletions(-)

diff --git a/src/strands/models/deepseek.py b/src/strands/models/deepseek.py
index 804302f4b..49c825347 100644
--- a/src/strands/models/deepseek.py
+++ b/src/strands/models/deepseek.py
@@ -104,6 +104,58 @@ def get_config(self) -> DeepSeekConfig:
         """
         return self.config
 
+    @classmethod
+    def format_request_messages(cls, messages: Messages, system_prompt: Optional[str] = None) -> list[dict[str, Any]]:
+        """Format DeepSeek compatible messages array (exactly like OpenAI)."""
+        formatted_messages: list[dict[str, Any]]
+        formatted_messages = [{"role": "system", "content": system_prompt}] if system_prompt else []
+
+        for message in messages:
+            contents = message["content"]
+
+            formatted_contents = [
+                {"text": content["text"], "type": "text"} for content in contents if "text" in content
+            ]
+            formatted_tool_calls = [
+                {
+                    "function": {
+                        "arguments": json.dumps(content["toolUse"]["input"]),
+                        "name": content["toolUse"]["name"],
+                    },
+                    "id": content["toolUse"]["toolUseId"],
+                    "type": "function",
+                }
+                for content in contents
+                if "toolUse" in content
+            ]
+            formatted_tool_messages = [
+                {
+                    "role": "tool",
+                    "tool_call_id": content["toolResult"]["toolUseId"],
+                    "content": "".join(
+                        [
+                            json.dumps(tool_content["json"]) if "json" in tool_content else tool_content["text"]
+                            for tool_content in content["toolResult"]["content"]
+                        ]
+                    ),
+                }
+                for content in contents
+                if "toolResult" in content
+            ]
+
+            # Flatten content for DeepSeek
+            text_content = "".join([c["text"] for c in formatted_contents])
+
+            formatted_message = {
+                "role": message["role"],
+                "content": text_content,
+                **({"tool_calls": formatted_tool_calls} if formatted_tool_calls else {}),
+            }
+            formatted_messages.append(formatted_message)
+            formatted_messages.extend(formatted_tool_messages)
+
+        return [message for message in formatted_messages if message["content"] or "tool_calls" in message]
+
     def format_request(
         self, messages: Messages, tool_specs: Optional[list[ToolSpec]] = None, system_prompt: Optional[str] = None
     ) -> dict[str, Any]:
@@ -117,25 +169,11 @@ def format_request(
         Returns:
             A DeepSeek chat request.
         """
-        formatted_messages = []
-
-        if system_prompt:
-            formatted_messages.append({"role": "system", "content": system_prompt})
-
-        # Convert Strands messages to OpenAI format
-        for message in messages:
-            if message["role"] in ["user", "assistant"]:
-                content = ""
-                for block in message["content"]:
-                    if "text" in block:
-                        content += block["text"]
-                formatted_messages.append({"role": message["role"], "content": content})
-
         request = {
             "model": self.config["model_id"],
-            "messages": formatted_messages,
+            "messages": self.format_request_messages(messages, system_prompt),
             "stream": True,
-            **self.config.get("params", {}),
+            **(self.config.get("params") or {}),
         }
 
         if tool_specs:
@@ -167,9 +205,24 @@ def format_chunk(self, event: dict[str, Any]) -> StreamEvent:
                 return {"messageStart": {"role": "assistant"}}
 
             case "content_start":
+                if event["data_type"] == "tool":
+                    return {
+                        "contentBlockStart": {
+                            "start": {
+                                "toolUse": {
+                                    "name": event["data"].function.name,
+                                    "toolUseId": event["data"].id,
+                                }
+                            }
+                        }
+                    }
                 return {"contentBlockStart": {"start": {}}}
 
             case "content_delta":
+                if event["data_type"] == "tool":
+                    return {
+                        "contentBlockDelta": {"delta": {"toolUse": {"input": event["data"].function.arguments or ""}}}
+                    }
                 if event["data_type"] == "reasoning_content":
                     return {"contentBlockDelta": {"delta": {"reasoningContent": {"text": event["data"]}}}}
                 return {"contentBlockDelta": {"delta": {"text": event["data"]}}}
@@ -178,10 +231,30 @@ def format_chunk(self, event: dict[str, Any]) -> StreamEvent:
                 return {"contentBlockStop": {}}
 
             case "message_stop":
-                return {"messageStop": {"stopReason": "end_turn"}}
+                match event["data"]:
+                    case "tool_calls":
+                        return {"messageStop": {"stopReason": "tool_use"}}
+                    case "length":
+                        return {"messageStop": {"stopReason": "max_tokens"}}
+                    case _:
+                        return {"messageStop": {"stopReason": "end_turn"}}
+
+            case "metadata":
+                return {
+                    "metadata": {
+                        "usage": {
+                            "inputTokens": event["data"].prompt_tokens,
+                            "outputTokens": event["data"].completion_tokens,
+                            "totalTokens": event["data"].total_tokens,
+                        },
+                        "metrics": {
+                            "latencyMs": 0,
+                        },
+                    },
+                }
 
             case _:
-                return {"contentBlockDelta": {"delta": {"text": ""}}}
+                raise RuntimeError(f"chunk_type=<{event['chunk_type']}> | unknown type")
 
     @override
     async def stream(
@@ -204,47 +277,68 @@ async def stream(
         """
         logger.debug("formatting request")
         request = self.format_request(messages, tool_specs, system_prompt)
-        logger.debug("request=<%s>", request)
+        logger.debug("request messages=<%s>", request.get("messages", []))
+        logger.debug("request tools=<%s>", len(request.get("tools", [])))
+
+        # Debug logging removed for production
+
+        # Debug logging disabled for production
+        # import logging
+        # logging.basicConfig(level=logging.DEBUG)
+        # logging.getLogger(__name__).setLevel(logging.DEBUG)
 
         logger.debug("invoking model")
         response = await self.client.chat.completions.create(**request)
 
         logger.debug("got response from model")
         yield self.format_chunk({"chunk_type": "message_start"})
-        yield self.format_chunk({"chunk_type": "content_start"})
-
-        async for chunk in response:
-            if hasattr(chunk, "choices") and chunk.choices:
-                choice = chunk.choices[0]
-
-                if hasattr(choice, "delta") and choice.delta:
-                    delta = choice.delta
-
-                    # Handle reasoning content
-                    if hasattr(delta, "reasoning_content") and delta.reasoning_content:
-                        yield self.format_chunk(
-                            {
-                                "chunk_type": "content_delta",
-                                "data_type": "reasoning_content",
-                                "data": delta.reasoning_content,
-                            }
-                        )
-
-                    # Handle regular content
-                    if hasattr(delta, "content") and delta.content:
-                        yield self.format_chunk(
-                            {
-                                "chunk_type": "content_delta",
-                                "data_type": "text",
-                                "data": delta.content,
-                            }
-                        )
+        yield self.format_chunk({"chunk_type": "content_start", "data_type": "text"})
+
+        tool_calls: dict[int, list[Any]] = {}
+
+        async for event in response:
+            # Defensive: skip events with empty or missing choices
+            if not getattr(event, "choices", None):
+                continue
+            choice = event.choices[0]
+
+            if choice.delta.content:
+                yield self.format_chunk(
+                    {"chunk_type": "content_delta", "data_type": "text", "data": choice.delta.content}
+                )
+
+            if hasattr(choice.delta, "reasoning_content") and choice.delta.reasoning_content:
+                yield self.format_chunk(
+                    {
+                        "chunk_type": "content_delta",
+                        "data_type": "reasoning_content",
+                        "data": choice.delta.reasoning_content,
+                    }
+                )
+
+            for tool_call in choice.delta.tool_calls or []:
+                tool_calls.setdefault(tool_call.index, []).append(tool_call)
+
+            if choice.finish_reason:
+                break
+
+        yield self.format_chunk({"chunk_type": "content_stop", "data_type": "text"})
+
+        for tool_deltas in tool_calls.values():
+            yield self.format_chunk({"chunk_type": "content_start", "data_type": "tool", "data": tool_deltas[0]})
+
+            for tool_delta in tool_deltas:
+                yield self.format_chunk({"chunk_type": "content_delta", "data_type": "tool", "data": tool_delta})
+
+            yield self.format_chunk({"chunk_type": "content_stop", "data_type": "tool"})
+
+        yield self.format_chunk({"chunk_type": "message_stop", "data": choice.finish_reason})
 
-                if hasattr(choice, "finish_reason") and choice.finish_reason:
-                    break
+        # Skip remaining events as we don't have use for anything except the final usage payload
+        async for event in response:
+            _ = event
 
-        yield self.format_chunk({"chunk_type": "content_stop"})
-        yield self.format_chunk({"chunk_type": "message_stop"})
+        yield self.format_chunk({"chunk_type": "metadata", "data": event.usage})
 
         logger.debug("finished streaming response from model")
 
@@ -285,7 +379,7 @@ async def structured_output(
 
 Return only the JSON object with the extracted data, no additional text."""
 
-        request_params = {
+        request_params: dict[str, Any] = {
             "model": self.config["model_id"],
             "messages": [{"role": "user", "content": json_prompt}],
             "response_format": {"type": "json_object"},
diff --git a/tests_integ/models/test_model_deepseek.py b/tests_integ/models/test_model_deepseek.py
index 9aae5f2d7..e88b4913e 100644
--- a/tests_integ/models/test_model_deepseek.py
+++ b/tests_integ/models/test_model_deepseek.py
@@ -21,20 +21,6 @@ def base_model():
     )
 
 
-@pytest.fixture()
-def reasoning_model():
-    return DeepSeekModel(
-        api_key=os.getenv("DEEPSEEK_API_KEY"), model_id="deepseek-reasoner", params={"max_tokens": 32000}
-    )
-
-
-@pytest.fixture()
-def beta_model():
-    return DeepSeekModel(
-        api_key=os.getenv("DEEPSEEK_API_KEY"), model_id="deepseek-chat", use_beta=True, params={"max_tokens": 1000}
-    )
-
-
 @pytest.fixture()
 def tools():
     @strands.tool
@@ -61,20 +47,25 @@ class PersonInfo(BaseModel):
     occupation: str = Field(description="Job or profession")
 
 
-class WeatherInfo(BaseModel):
-    """Weather information."""
-
-    location: str = Field(description="City and state")
-    temperature: str = Field(description="Current temperature")
-    condition: str = Field(description="Weather condition")
-
-
 def test_basic_conversation(base_agent):
     result = base_agent("Hello, how are you today?")
     assert "content" in result.message
     assert len(result.message["content"]) > 0
 
 
+def test_tool_usage(base_agent):
+    result = base_agent("What is the time and weather?")
+    content = result.message.get("content", [])
+
+    # Check for tool calls
+    tool_calls = [block for block in content if "toolUse" in block]
+    if tool_calls:
+        tool_names = [tool["toolUse"]["name"] for tool in tool_calls]
+        assert "tool_time" in tool_names or "tool_weather" in tool_names
+
+    assert result.message is not None
+
+
 def test_structured_output_person(base_agent):
     result = base_agent.structured_output(
         PersonInfo, "John Smith is a 30-year-old software engineer working at a tech startup."
@@ -84,27 +75,68 @@ def test_structured_output_person(base_agent):
     assert "engineer" in result.occupation.lower()
 
 
-def test_tool_usage(base_agent):
-    result = base_agent("What is the time and weather?")
-    # Handle case where content might be empty or structured differently
+def test_calculator_integration():
+    """Test calculator tool integration like ds_test.py"""
+    try:
+        from strands_tools import calculator
+    except ImportError:
+        pytest.skip("strands_tools not available")
+
+    model = DeepSeekModel(
+        api_key=os.getenv("DEEPSEEK_API_KEY"),
+        base_url="https://api.deepseek.com",
+        model_id="deepseek-chat",
+        params={"max_tokens": 2000, "temperature": 0.7},
+    )
+
+    agent = Agent(model=model, tools=[calculator])
+    result = agent("What is 42 ^ 9")
+
+    # Verify response exists
+    assert result.message is not None
     content = result.message.get("content", [])
-    if content and "text" in content[0]:
-        text = content[0]["text"].lower()
-        assert any(string in text for string in ["12:00", "sunny"])
-    else:
-        # If no text content, just verify the result exists
-        assert result.message is not None
+    assert len(content) > 0
+
+    # Check for tool calls
+    tool_calls = [block for block in content if "toolUse" in block]
+    if tool_calls:
+        for tool_call in tool_calls:
+            assert tool_call["toolUse"]["name"] == "calculator"
+            assert "input" in tool_call["toolUse"]
+
+
+def test_multi_tool_workflow():
+    """Test multi-tool workflow like ds_test.py"""
+    try:
+        from strands_tools import calculator, file_read, shell
+    except ImportError:
+        pytest.skip("strands_tools not available")
+
+    model = DeepSeekModel(
+        api_key=os.getenv("DEEPSEEK_API_KEY"),
+        base_url="https://api.deepseek.com",
+        model_id="deepseek-chat",
+        params={"max_tokens": 2000, "temperature": 0.7},
+    )
 
+    agent = Agent(model=model, tools=[calculator, file_read, shell])
 
-@pytest.mark.asyncio
-async def test_streaming(base_model):
-    agent = Agent(model=base_model)
-    events = []
-    async for event in agent.stream_async("Tell me a short fact about robots"):
-        events.append(event)
+    # Test 1: Calculator
+    result1 = agent("What is 42 ^ 9")
+    assert result1.message is not None
+    content1 = result1.message.get("content", [])
+    tool_calls1 = [block for block in content1 if "toolUse" in block]
+    if tool_calls1:
+        assert any(tool["toolUse"]["name"] == "calculator" for tool in tool_calls1)
 
-    assert len(events) > 0
-    assert "result" in events[-1]
+    # Test 2: File operations
+    result2 = agent("Show me the contents of a single file in this directory")
+    assert result2.message is not None
+    content2 = result2.message.get("content", [])
+    tool_calls2 = [block for block in content2 if "toolUse" in block]
+    if tool_calls2:
+        tool_names = [tool["toolUse"]["name"] for tool in tool_calls2]
+        assert any(name in ["file_read", "shell"] for name in tool_names)
 
 
 def test_config_update(base_model):
@@ -114,15 +146,18 @@ def test_config_update(base_model):
     base_model.update_config(model_id="deepseek-reasoner", params={"temperature": 0.5})
     updated_config = base_model.get_config()
     assert updated_config["model_id"] == "deepseek-reasoner"
+    assert updated_config["params"]["temperature"] == 0.5
 
 
-def test_weather_structured_output(base_agent):
-    result = base_agent.structured_output(
-        WeatherInfo, "Get the weather for San Francisco, CA. It's currently 72°F and sunny."
-    )
-    assert "san francisco" in result.location.lower()
-    assert "72" in result.temperature
-    assert "sunny" in result.condition.lower()
+@pytest.mark.asyncio
+async def test_streaming(base_model):
+    agent = Agent(model=base_model)
+    events = []
+    async for event in agent.stream_async("Tell me a short fact about robots"):
+        events.append(event)
+
+    assert len(events) > 0
+    assert "result" in events[-1]
 
 
 @pytest.mark.asyncio