strands-agents · Jun 17, 2025
diff --git a/‎README.md
Lines changed: 12 additions & 0 deletions b/‎README.md
Lines changed: 12 additions & 0 deletions
diff --git a/‎pyproject.toml
Lines changed: 10 additions & 3 deletions b/‎pyproject.toml
Lines changed: 10 additions & 3 deletions
diff --git a/‎src/strands/models/portkey.py
Lines changed: 386 additions & 0 deletions b/‎src/strands/models/portkey.py
Lines changed: 386 additions & 0 deletions
diff --git a/‎tests/strands/models/test_portkey.py
Lines changed: 228 additions & 0 deletions b/‎tests/strands/models/test_portkey.py
Lines changed: 228 additions & 0 deletions
@@ -118,6 +118,7 @@ from strands import Agent
 from strands.models import BedrockModel
 from strands.models.ollama import OllamaModel
 from strands.models.llamaapi import LlamaAPIModel
+from strands.models.portkey import PortkeyModel
 
 # Bedrock
 bedrock_model = BedrockModel(
@@ -142,6 +143,17 @@ llama_model = LlamaAPIModel(
 )
 agent = Agent(model=llama_model)
 response = agent("Tell me about Agentic AI")
+
+# Portkey for all models
+portkey_model = PortkeyModel(
+    api_key="<PORTKEY_API_KEY>",
+    model_id="anthropic.claude-3-5-sonnet-20241022-v2:0",
+    virtual_key="<BEDROCK_VIRTUAL_KEY>",
+    provider="bedrock",
+    base_url="http://portkey-service-gateway.service.prod.example.com/v1",
+)
+agent = Agent(model=portkey_model)
+response = agent("Tell me about Agentic AI")
 ```
 
 Built-in providers:
 
@@ -49,6 +49,8 @@ packages = ["src/strands"]
 anthropic = [
     "anthropic>=0.21.0,<1.0.0",
 ]
+# Optional dependencies for different AI providers
+
 dev = [
     "commitizen>=4.4.0,<5.0.0",
     "hatch>=1.0.0,<2.0.0",
@@ -88,12 +90,17 @@ a2a = [
     "starlette>=0.46.2",
 ]
 
+portkey = [
+    "portkey-ai>=1.0.0,<2.0.0",
+]
+
 [tool.hatch.version]
 # Tells Hatch to use your version control system (git) to determine the version.
 source = "vcs"
 
 [tool.hatch.envs.hatch-static-analysis]
-features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel"]
+features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel", "portkey"]
+
 dependencies = [
   "mypy>=1.15.0,<2.0.0",
   "ruff>=0.11.6,<0.12.0",
@@ -116,7 +123,7 @@ lint-fix = [
 ]
 
 [tool.hatch.envs.hatch-test]
-features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel"]
+features = ["anthropic", "litellm", "llamaapi", "ollama", "openai", "otel", "portkey"]
 extra-dependencies = [
     "moto>=5.1.0,<6.0.0",
     "pytest>=8.0.0,<9.0.0",
@@ -132,7 +139,7 @@ extra-args = [
 
 [tool.hatch.envs.dev]
 dev-mode = true
-features = ["dev", "docs", "anthropic", "litellm", "llamaapi", "ollama", "otel"]
+features = ["dev", "docs", "anthropic", "litellm", "llamaapi", "ollama", "otel", "portkey"]
 
 [tool.hatch.envs.a2a]
 dev-mode = true
 
@@ -0,0 +1,386 @@
+"""Implementation of the Portkey model provider integration."""
+
+import json
+import logging
+import uuid
+from typing import Any, Dict, Iterable, List, Optional, cast
+
+from portkey_ai import Portkey
+from typing_extensions import TypedDict, override
+
+from ..types.content import Messages
+from ..types.exceptions import ContextWindowOverflowException
+from ..types.models import Model
+from ..types.streaming import StreamEvent
+from ..types.tools import ToolSpec
+
+# Configure logger for debug-level output
+logger = logging.getLogger(__name__)
+
+
+class PortkeyModel(Model):
+    """Portkey model provider implementation."""
+
+    class PortkeyConfig(TypedDict, total=False):
+        """Configuration schema for the Portkey model.
+
+        Every key is optional at the type level (``total=False``); ``__init__`` nevertheless
+        indexes ``api_key``, ``virtual_key``, ``base_url`` and ``model_id`` directly when it
+        builds the client.
+
+        Attributes:
+            api_key: Passed to the Portkey client as ``api_key``.
+            virtual_key: Passed to the Portkey client as ``virtual_key``.
+            base_url: Passed to the Portkey client as ``base_url``.
+            model_id: Passed to the client as ``model`` and sent as ``model`` in every request.
+            provider: Provider name consulted when deciding whether tools may be sent.
+            streaming: Set to True by ``__init__``; not read elsewhere in this class.
+        """
+
+        api_key: str
+        virtual_key: str
+        base_url: str
+        model_id: str
+        provider: str
+        streaming: bool
+
+    def __init__(self, **model_config: PortkeyConfig):
+        """Initialize the Portkey model provider.
+
+        Stores the configuration (``streaming`` defaults to True and may be overridden by
+        ``model_config``), records the provider name, and builds the Portkey client.
+
+        Args:
+            **model_config (PortkeyConfig): Configuration parameters for the model.
+
+        Raises:
+            KeyError: If ``api_key``, ``virtual_key``, ``base_url`` or ``model_id`` is missing.
+        """
+        self.config = PortkeyModel.PortkeyConfig()
+        self.config["streaming"] = True
+        self.update_config(**model_config)
+
+        # Provider name (bedrock, openai, anthropic, ...). It is NOT inferred from model_id:
+        # when omitted it is stored as "" and _allow_tool_use() then disables tool calling.
+        self.provider: str = str(self.config.get("provider", ""))
+
+        # Credentials must never reach the log, so mask them before formatting the config.
+        redacted = {
+            key: ("***" if key in ("api_key", "virtual_key") else value) for key, value in self.config.items()
+        }
+        logger.debug("PortkeyModel initialized with config: %s", redacted)
+
+        self.client = Portkey(
+            api_key=self.config["api_key"],
+            virtual_key=self.config["virtual_key"],
+            base_url=self.config["base_url"],
+            model=self.config["model_id"],
+        )
+        # Per-response tool-call tracking, filled by format_chunk() and cleared by converse().
+        self._current_tool_use_id: Optional[str] = None
+        self._current_tool_name: Optional[str] = None
+        self._current_tool_args = ""
+
+    @override
+    def update_config(self, **model_config: PortkeyConfig) -> None:
+        """Update the model configuration.
+
+        Merges ``model_config`` into the stored configuration. When ``provider`` is among the
+        updated keys, ``self.provider`` is refreshed too so the tool-use check does not keep
+        using a stale provider name.
+
+        Args:
+            **model_config (PortkeyConfig): Configuration parameters to update.
+        """
+        # Credentials must never reach the log, so mask them before formatting.
+        redacted = {
+            key: ("***" if key in ("api_key", "virtual_key") else value) for key, value in model_config.items()
+        }
+        logger.debug("Updating config with: %s", redacted)
+        self.config.update(cast(PortkeyModel.PortkeyConfig, model_config))
+        if "provider" in model_config:
+            self.provider = str(model_config["provider"])
+
+    @override
+    def get_config(self) -> PortkeyConfig:
+        """Return the configuration currently held by this model.
+
+        The stored dictionary itself is returned (not a copy).
+
+        Returns:
+            PortkeyConfig: The current configuration dictionary.
+        """
+        current_config = self.config
+        logger.debug("Retrieving current model config")
+        return current_config
+
+    @override
+    def format_request(
+        self,
+        messages: Messages,
+        tool_specs: Optional[List[ToolSpec]] = None,
+        system_prompt: Optional[str] = None,
+    ) -> Dict[str, Any]:
+        """Build the keyword arguments for a streaming Portkey chat-completion call.
+
+        The system prompt (if any) becomes the first message, followed by the formatted
+        ``user``/``assistant`` messages that have non-empty content. Tools are attached, with
+        ``tool_choice`` set to ``"auto"``, only when tool specs were supplied and the current
+        provider/model combination allows tool use.
+
+        Args:
+            messages (Messages): List of messages to format.
+            tool_specs (Optional[List[ToolSpec]]): Optional list of tool specifications.
+            system_prompt (Optional[str]): Optional system prompt string.
+
+        Returns:
+            Dict[str, Any]: Formatted request dictionary.
+        """
+        chat_messages: List[Dict[str, Any]] = []
+        if system_prompt:
+            chat_messages.append({"role": "system", "content": system_prompt})
+
+        for message in messages:
+            sender = message.get("role")
+            body = message.get("content")
+            # Skip roles other than user/assistant and messages without content.
+            if sender not in ("user", "assistant") or not body:
+                continue
+            chat_messages.extend(self._format_message_parts(sender, body))
+
+        payload: Dict[str, Any] = {
+            "messages": chat_messages,
+            "model": self.config["model_id"],
+            "stream": True,
+        }
+
+        mapped_tools = self._map_tools(tool_specs) if tool_specs and self._allow_tool_use() else None
+        if mapped_tools:
+            payload["tools"] = mapped_tools
+            payload["tool_choice"] = "auto"
+
+        # Only the first 300 characters of the serialized request are logged.
+        logger.debug("Formatted Portkey request: %s", json.dumps(payload, default=str)[:300])
+        return payload
+
+    def _allow_tool_use(self) -> bool:
+        """Report whether tools may be sent for the configured provider and model.
+
+        ``openai`` always allows tools; ``bedrock`` allows them only when the model id contains
+        ``anthropic``; every other provider does not. Comparisons are case-insensitive.
+
+        Returns:
+            bool: True if tool use is allowed for the current provider and model.
+        """
+        provider_name = str(self.provider).lower()
+        if provider_name == "bedrock":
+            return "anthropic" in self.config.get("model_id", "").lower()
+        return provider_name == "openai"
+
+    @override
+    def stream(self, request: Dict[str, Any]) -> Iterable[Any]:
+        """Send the request to the Portkey client and return an iterator over its response.
+
+        Args:
+            request (Dict[str, Any]): The formatted request dictionary.
+
+        Returns:
+            Iterable[Any]: An iterable stream of response events.
+
+        Raises:
+            ContextWindowOverflowException: Re-raised (after logging) if the client call raises it.
+        """
+        # NOTE(review): only the call below is guarded; errors raised later, while the caller
+        # iterates the returned stream, are not handled here. Whether the Portkey client ever
+        # raises ContextWindowOverflowException itself is not visible from this module --
+        # provider overflow errors presumably need translating; confirm.
+        try:
+            completion = self.client.chat.completions.create(**request)
+            return iter(completion)
+        except ContextWindowOverflowException:
+            logger.error("Context window exceeded for request: %s", request)
+            raise
+
+    @override
+    def format_chunk(self, event: Any) -> StreamEvent:
+        """Format a single response event into a stream event for Strands Agents.
+
+        Mapping, in priority order:
+
+        * first tool-call delta carrying both a name and a type (while no tool call is being
+          tracked) -> ``contentBlockStart`` with a generated ``toolUseId``;
+        * tool-call delta with argument text -> ``contentBlockDelta`` (``toolUse.input``);
+        * ``finish_reason`` of ``tool_calls``/``tool_use`` -> ``contentBlockStop``;
+        * text content -> ``contentBlockDelta`` (``text``);
+        * ``usage`` payload -> ``metadata``;
+        * anything else -> an empty event.
+
+        Only the first choice and the first tool call of an event are inspected.
+
+        Args:
+            event (Any): The raw response event from the model (dict-like, accessed via ``.get``).
+
+        Returns:
+            StreamEvent: The formatted stream event dictionary.
+        """
+        # Usage-only chunks may carry an empty ``choices`` list, and ``delta``/``function`` may
+        # be present but None; normalise all of these to empty dicts instead of crashing.
+        choices = event.get("choices") or [{}]
+        choice = choices[0]
+        delta = choice.get("delta") or {}
+
+        tool_calls = delta.get("tool_calls")
+        if tool_calls:
+            tool_call = tool_calls[0]
+            function = tool_call.get("function") or {}
+            tool_name = function.get("name")
+            call_type = tool_call.get("type")
+            arguments_chunk = function.get("arguments") or ""
+            if tool_name and call_type and not self._current_tool_name:
+                self._current_tool_name = tool_name
+                # The provider-supplied call id is not used; a local id is generated instead.
+                self._current_tool_use_id = f"{tool_name}-{uuid.uuid4().hex[:6]}"
+                # Arguments on this first chunk are stored on the instance only; they are not
+                # part of the returned start event.
+                self._current_tool_args = arguments_chunk
+                return cast(
+                    StreamEvent,
+                    {
+                        "contentBlockStart": {
+                            "start": {
+                                "toolUse": {
+                                    "name": self._current_tool_name,
+                                    "toolUseId": self._current_tool_use_id,
+                                }
+                            }
+                        }
+                    },
+                )
+
+            if arguments_chunk:
+                return cast(StreamEvent, {"contentBlockDelta": {"delta": {"toolUse": {"input": arguments_chunk}}}})
+
+        if choice.get("finish_reason") in ("tool_calls", "tool_use"):
+            return cast(
+                StreamEvent,
+                {
+                    "contentBlockStop": {
+                        "name": self._current_tool_name,
+                        "toolUseId": self._current_tool_use_id,
+                    }
+                },
+            )
+
+        if delta.get("content"):
+            return cast(StreamEvent, {"contentBlockDelta": {"delta": {"text": delta["content"]}}})
+        elif event.get("usage"):
+            usage_data = event["usage"]
+            return cast(
+                StreamEvent,
+                {
+                    "metadata": {
+                        # Latency is not measured here; a constant 0 is reported.
+                        "metrics": {"latencyMs": 0},
+                        "usage": {
+                            "inputTokens": usage_data["prompt_tokens"],
+                            "outputTokens": usage_data["completion_tokens"],
+                            "totalTokens": usage_data["total_tokens"],
+                        },
+                    }
+                },
+            )
+        return cast(StreamEvent, {})
+
+    @override
+    def converse(
+        self,
+        messages: Messages,
+        tool_specs: Optional[list[ToolSpec]] = None,
+        system_prompt: Optional[str] = None,
+    ) -> Iterable[StreamEvent]:
+        """Converse with the model by streaming formatted message chunks.
+
+        Formats the request, sends it, yields a ``messageStart`` event, then one formatted
+        chunk per raw event. After any event whose finish reason signals a tool call, a
+        ``messageStop`` event with ``stopReason`` ``tool_use`` is yielded as well; no
+        ``messageStop`` is emitted for other finish reasons.
+
+        Args:
+            messages (Messages): List of message objects to be processed by the model.
+            tool_specs (Optional[list[ToolSpec]]): List of tool specifications available to the model.
+            system_prompt (Optional[str]): System prompt to provide context to the model.
+
+        Yields:
+            Iterable[StreamEvent]: Formatted message chunks from the model.
+
+        Raises:
+            ContextWindowOverflowException: Propagated from ``stream`` when the client raises it.
+        """
+        try:
+            logger.debug("formatting request")
+            request = self.format_request(messages, tool_specs, system_prompt)
+
+            logger.debug("invoking model %s", request)
+            response = self.stream(request)
+            logger.debug("streaming response from model %s", response)
+
+            yield cast(StreamEvent, {"messageStart": {"role": "assistant"}})
+
+            for event in response:
+                yield self.format_chunk(event)
+
+                if self._should_terminate_with_tool_use(event):
+                    yield cast(StreamEvent, {"messageStop": {"stopReason": "tool_use"}})
+                    logger.debug("finished streaming response from model")
+        finally:
+            # Always clear the per-response tool tracking, even when the stream raises or the
+            # consumer stops iterating early. A leftover _current_tool_name would otherwise
+            # stop format_chunk() from emitting the start event of the next tool call.
+            self._current_tool_use_id = None
+            self._current_tool_name = None
+            self._current_tool_args = ""
+
+    @staticmethod
+    def _should_terminate_with_tool_use(event: dict) -> bool:
+        """Determine whether the stream should terminate due to a tool use.
+
+        Only the first choice's ``finish_reason`` is inspected; it is compared
+        case-insensitively against ``tool_calls`` and ``tool_use``. An event that carries a
+        tool-call payload but reports another finish reason (for example ``stop``) is NOT
+        treated as a tool-use termination.
+
+        Args:
+            event (dict): The raw event from the model.
+
+        Returns:
+            bool: True if the event indicates a tool use termination.
+        """
+        # ``choices`` may be missing or an empty list (e.g. usage-only chunks).
+        choices = event.get("choices") or [{}]
+        finish_reason = (choices[0].get("finish_reason") or "").lower()
+        return finish_reason in ("tool_calls", "tool_use")
+
+    def _format_tool_use_part(self, part: dict) -> dict:
+        """Convert a ``toolUse`` message part into an assistant message with one tool call.
+
+        As a side effect the part's ``toolUseId`` is remembered on the instance as the
+        current tool-use id.
+
+        Args:
+            part (dict): The part of the message representing a tool use.
+
+        Returns:
+            dict: Formatted dictionary representing the tool use.
+        """
+        logger.debug("Formatting tool use part: %s", part)
+        tool_use = part["toolUse"]
+        self._current_tool_use_id = tool_use["toolUseId"]
+
+        # The tool input is sent as a JSON-encoded string in ``arguments``.
+        function_call = {"name": tool_use["name"], "arguments": json.dumps(tool_use["input"])}
+        tool_call = {"id": self._current_tool_use_id, "type": "function", "function": function_call}
+        return {"role": "assistant", "tool_calls": [tool_call], "content": None}
+
+    def _format_tool_result_part(self, part: dict) -> dict:
+        """Format a tool result part of a message into the standard dictionary format.
+
+        The text entries of the result content are joined with single spaces; entries
+        without a ``text`` key are ignored.
+
+        Args:
+            part (dict): The part of the message representing a tool result.
+
+        Returns:
+            dict: Formatted dictionary representing the tool result.
+        """
+        logger.debug("Formatting tool result part: %s", part)
+        tool_result = part["toolResult"]
+        result_text = " ".join(c["text"] for c in tool_result["content"] if "text" in c)
+        # Prefer the id carried by the result itself so that several tool calls in one turn are
+        # matched to their own results; fall back to the last tool-use id seen when it is absent.
+        tool_call_id = tool_result.get("toolUseId") or self._current_tool_use_id
+        return {"role": "tool", "tool_call_id": tool_call_id, "content": result_text}
+
+    def _format_message_parts(self, role: str, content: Any) -> List[Dict[str, Any]]:
+        """Turn one message's content into a list of chat-completion message dictionaries.
+
+        A plain string becomes a single message. For a list, each part is converted in order:
+        text parts keep the given role, ``toolUse`` parts become assistant tool-call messages,
+        and ``toolResult`` parts become tool messages (only while a current tool-use id is
+        set). Unrecognised parts, and content that is neither a string nor a list, yield nothing.
+
+        Args:
+            role (str): The role of the message sender (e.g., 'user', 'assistant').
+            content (Any): The content of the message, can be string or list of parts.
+
+        Returns:
+            List[Dict[str, Any]]: List of formatted message dictionaries.
+        """
+        logger.debug("Formatting message parts for role '%s' with content: %s", role, content)
+        if isinstance(content, str):
+            return [{"role": role, "content": content}]
+
+        formatted: List[Dict[str, Any]] = []
+        if not isinstance(content, list):
+            return formatted
+
+        for item in content:
+            if "text" in item and isinstance(item["text"], str):
+                formatted.append({"role": role, "content": item["text"]})
+                continue
+            if "toolUse" in item:
+                formatted.append(self._format_tool_use_part(item))
+                continue
+            if "toolResult" in item and self._current_tool_use_id:
+                formatted.append(self._format_tool_result_part(item))
+        return formatted
+
+    @staticmethod
+    def _map_tools(tool_specs: List[ToolSpec]) -> List[Dict[str, Any]]:
+        """Convert tool specifications into function-tool dictionaries for the request.
+
+        Each property schema is copied as-is, except that a ``default`` entry whose value is
+        None is dropped. ``required`` defaults to an empty list when the spec has none.
+
+        Args:
+            tool_specs (List[ToolSpec]): List of tool specifications.
+
+        Returns:
+            List[Dict[str, Any]]: Mapped list of tool dictionaries.
+        """
+        logger.debug("Mapping tool specs: %s", tool_specs)
+        mapped: List[Dict[str, Any]] = []
+        for spec in tool_specs:
+            tool_name = spec["name"]
+            tool_description = spec["description"]
+            schema = spec["inputSchema"]["json"]
+
+            properties: Dict[str, Any] = {}
+            for prop_name, prop_schema in schema.get("properties", {}).items():
+                cleaned = {}
+                for field, field_value in prop_schema.items():
+                    # Drop only an explicit ``default: None``; keep every other entry.
+                    if field == "default" and field_value is None:
+                        continue
+                    cleaned[field] = field_value
+                properties[prop_name] = cleaned
+
+            parameters = {
+                "type": "object",
+                "properties": properties,
+                "required": schema.get("required", []),
+            }
+            function = {"name": tool_name, "description": tool_description, "parameters": parameters}
+            mapped.append({"type": "function", "function": function})
+        return mapped
@@ -0,0 +1,228 @@
+# Python
+import unittest.mock
+
+import pytest
+
+from src.strands.models.portkey import PortkeyModel
+from src.strands.types.exceptions import ContextWindowOverflowException
+
+
+@pytest.fixture
+def model_config():
+    return {
+        "api_key": "test_api_key",
+        "virtual_key": "test_virtual_key",
+        "base_url": "https://test.url",
+        "model_id": "test_model_id",
+        "provider": "openai",
+    }
+
+
+@pytest.fixture
+def portkey_model(model_config):
+    return PortkeyModel(**model_config)
+
+
+def test__init__(portkey_model):
+    assert portkey_model.config["api_key"] == "test_api_key"
+    assert portkey_model.provider == "openai"
+
+
+def test_get_config(portkey_model):
+    config = portkey_model.get_config()
+    assert config["api_key"] == "test_api_key"
+
+
+def test_format_request_no_tools(portkey_model):
+    messages = [{"role": "user", "content": "Hello"}]
+    request = portkey_model.format_request(messages)
+    assert "tools" not in request
+
+
+def test_format_request_with_tools(portkey_model):
+    messages = [{"role": "user", "content": "Hello"}]
+    tool_specs = [{"name": "test_tool", "description": "Test tool", "inputSchema": {"json": {"properties": {}}}}]
+    request = portkey_model.format_request(messages, tool_specs)
+    assert "tools" in request
+
+
+def test_format_request_system_prompt(portkey_model):
+    messages = [{"role": "user", "content": "Hello"}]
+    system_prompt = "Test system prompt"
+    request = portkey_model.format_request(messages, system_prompt=system_prompt)
+    assert request["messages"][0]["role"] == "system"
+
+
+def test_allow_tool_use_openai(portkey_model):
+    assert portkey_model._allow_tool_use()
+
+
+def test_allow_tool_use_bedrock():
+    model_config = {
+        "api_key": "test_api_key",
+        "virtual_key": "test_virtual_key",
+        "base_url": "https://test.url",
+        "model_id": "anthropic_model_id",
+        "provider": "bedrock",
+    }
+    portkey_model = PortkeyModel(**model_config)
+    assert portkey_model._allow_tool_use() is True
+
+
+def test_allow_tool_use_false():
+    model_config = {
+        "api_key": "test_api_key",
+        "virtual_key": "test_virtual_key",
+        "base_url": "https://test.url",
+        "model_id": "test_model_id",
+        "provider": "unknown",
+    }
+    portkey_model = PortkeyModel(**model_config)
+    assert portkey_model._allow_tool_use() is False
+
+
+def test_stream(portkey_model):
+    mock_event = {"choices": [{"delta": {"content": "test"}}]}
+    with unittest.mock.patch.object(portkey_model.client.chat.completions, "create", return_value=iter([mock_event])):
+        request = {"messages": [{"role": "user", "content": "Hello"}], "model": "test_model_id", "stream": True}
+        response = list(portkey_model.stream(request))
+        assert response[0]["choices"][0]["delta"]["content"] == "test"
+
+
+def test_stream_context_window_exception(portkey_model):
+    with unittest.mock.patch.object(
+        portkey_model.client.chat.completions,
+        "create",
+        side_effect=ContextWindowOverflowException("Context window exceeded"),
+    ):
+        request = {"messages": [{"role": "user", "content": "Hello"}], "model": "test_model_id", "stream": True}
+        with pytest.raises(ContextWindowOverflowException):
+            list(portkey_model.stream(request))
+
+
+def test_format_chunk_tool_calls(portkey_model):
+    event = {
+        "choices": [
+            {
+                "delta": {
+                    "tool_calls": [
+                        {
+                            "function": {"name": "test_tool", "arguments": "test_args"},
+                            "type": "function",
+                        }
+                    ]
+                },
+                "finish_reason": None,
+            }
+        ]
+    }
+    chunk = portkey_model.format_chunk(event)
+    assert "contentBlockStart" in chunk
+
+
+def test_format_chunk_arguments_chunk(portkey_model):
+    event = {
+        "choices": [
+            {
+                "delta": {
+                    "tool_calls": [
+                        {
+                            "function": {"arguments": "test_args"},
+                        }
+                    ]
+                },
+                "finish_reason": None,
+            }
+        ]
+    }
+    chunk = portkey_model.format_chunk(event)
+    assert "contentBlockDelta" in chunk
+
+
+def test_format_chunk_finish_reason_tool_calls(portkey_model):
+    event = {"choices": [{"finish_reason": "tool_calls"}]}
+    chunk = portkey_model.format_chunk(event)
+    assert "contentBlockStop" in chunk
+
+
+def test_format_chunk_usage(portkey_model):
+    event = {
+        "usage": {
+            "prompt_tokens": 10,
+            "completion_tokens": 5,
+            "total_tokens": 15,
+        },
+        "choices": [{"delta": {"content": None}}],  # Ensure 'content' key exists
+    }
+    chunk = portkey_model.format_chunk(event)
+    assert chunk["metadata"]["usage"]["totalTokens"] == 15
+
+
+def test_format_message_parts_string(portkey_model):
+    parts = portkey_model._format_message_parts("user", "test content")
+    assert parts == [{"role": "user", "content": "test content"}]
+
+
+def test_format_message_parts_list_with_text(portkey_model):
+    content = [{"text": "test text"}]
+    parts = portkey_model._format_message_parts("assistant", content)
+    assert parts == [{"role": "assistant", "content": "test text"}]
+
+
+def test_format_message_parts_tool_use(portkey_model):
+    content = [{"toolUse": {"toolUseId": "123", "name": "test_tool", "input": {}}}]
+    parts = portkey_model._format_message_parts("assistant", content)
+    assert "tool_calls" in parts[0]
+
+
+def test_format_message_parts_tool_result(portkey_model):
+    portkey_model._current_tool_use_id = "123"
+    content = [{"toolResult": {"content": [{"text": "result text"}]}}]
+    parts = portkey_model._format_message_parts("assistant", content)
+    assert parts[0]["content"] == "result text"
+
+
+def test_map_tools(portkey_model):
+    tool_specs = [
+        {
+            "name": "test_tool",
+            "description": "Test tool",
+            "inputSchema": {
+                "json": {
+                    "properties": {"arg1": {"type": "string"}},
+                    "required": ["arg1"],
+                }
+            },
+        }
+    ]
+    tools = portkey_model._map_tools(tool_specs)
+    assert tools[0]["function"]["name"] == "test_tool"
+    assert tools[0]["function"]["parameters"]["required"] == ["arg1"]
+
+
+def test_format_tool_use_part(portkey_model):
+    part = {"toolUse": {"toolUseId": "123", "name": "test_tool", "input": {}}}
+    formatted = portkey_model._format_tool_use_part(part)
+    assert formatted["tool_calls"][0]["function"]["name"] == "test_tool"
+
+
+def test_format_tool_result_part(portkey_model):
+    portkey_model._current_tool_use_id = "123"
+    part = {"toolResult": {"content": [{"text": "result text"}]}}
+    formatted = portkey_model._format_tool_result_part(part)
+    assert formatted["content"] == "result text"
+
+
+def test_should_terminate_with_tool_use(portkey_model):
+    event = {"choices": [{"finish_reason": "tool_calls"}]}
+    assert portkey_model._should_terminate_with_tool_use(event) is True
+
+
+def test_converse(portkey_model):
+    mock_event = {"choices": [{"delta": {"content": "test"}}]}
+    with unittest.mock.patch.object(portkey_model.client.chat.completions, "create", return_value=iter([mock_event])):
+        messages = [{"role": "user", "content": "Hello"}]
+        tool_specs = [{"name": "test_tool", "description": "Test tool", "inputSchema": {"json": {"properties": {}}}}]
+        system_prompt = "Test system prompt"
+        response = list(portkey_model.converse(messages, tool_specs, system_prompt))
+        assert response[0]["messageStart"]["role"] == "assistant"