fix(bedrock): upgrade default model to Claude Sonnet 4.6 (#2193)

afarntrog · web-flow · commit ce64c3a94052 · 2026-04-24T14:41:57.000-04:00
diff --git a/src/strands/models/bedrock.py b/src/strands/models/bedrock.py
@@ -36,8 +36,8 @@
 logger = logging.getLogger(__name__)
 
 # See: `BedrockModel._get_default_model_with_warning` for why we need both
-DEFAULT_BEDROCK_MODEL_ID = "us.anthropic.claude-sonnet-4-20250514-v1:0"
-_DEFAULT_BEDROCK_MODEL_ID = "{}.anthropic.claude-sonnet-4-20250514-v1:0"
+DEFAULT_BEDROCK_MODEL_ID = "global.anthropic.claude-sonnet-4-6"
+_DEFAULT_BEDROCK_MODEL_ID = "{}.anthropic.claude-sonnet-4-6"
 DEFAULT_BEDROCK_REGION = "us-west-2"
 
 BEDROCK_CONTEXT_WINDOW_OVERFLOW_MESSAGES = [
@@ -90,7 +90,7 @@ class BedrockConfig(BaseModelConfig, total=False):
             guardrail_latest_message: Flag to send only the latest user message to guardrails.
                 Defaults to False.
             max_tokens: Maximum number of tokens to generate in the response
-            model_id: The Bedrock model ID (e.g., "us.anthropic.claude-sonnet-4-20250514-v1:0")
+            model_id: The Bedrock model ID (e.g., "global.anthropic.claude-sonnet-4-6")
             include_tool_result_status: Flag to include status field in tool results.
                 True includes status, False removes status, "auto" determines based on model_id. Defaults to "auto".
             service_tier: Service tier for the request, controlling the trade-off between latency and cost.
@@ -1151,13 +1151,13 @@ def _get_default_model_with_warning(region_name: str, model_config: BedrockConfi
             region_name (str): region for bedrock model
             model_config (Optional[dict[str, Any]]): Model Config that caller passes in on init
         """
-        if DEFAULT_BEDROCK_MODEL_ID != _DEFAULT_BEDROCK_MODEL_ID.format("us"):
-            return DEFAULT_BEDROCK_MODEL_ID
-
         model_config = model_config or {}
         if model_config.get("model_id"):
             return model_config["model_id"]
 
+        if DEFAULT_BEDROCK_MODEL_ID != _DEFAULT_BEDROCK_MODEL_ID.format("us"):
+            return DEFAULT_BEDROCK_MODEL_ID
+
         prefix_inference_map = {"ap": "apac"}  # some inference endpoints can be a bit different than the region prefix
 
         prefix = "-".join(region_name.split("-")[:-2]).lower()  # handles `us-east-1` or `us-gov-east-1`
diff --git a/tests/strands/agent/test_agent.py b/tests/strands/agent/test_agent.py
@@ -35,7 +35,7 @@
 from tests.fixtures.mocked_model_provider import MockedModelProvider
 
 # For unit testing we will use the us inference
-FORMATTED_DEFAULT_MODEL_ID = DEFAULT_BEDROCK_MODEL_ID.format("us")
+FORMATTED_DEFAULT_MODEL_ID = DEFAULT_BEDROCK_MODEL_ID
 
 
 @pytest.fixture
diff --git a/tests/strands/models/test_bedrock.py b/tests/strands/models/test_bedrock.py
@@ -16,15 +16,14 @@
 from strands import _exception_notes
 from strands.models import BedrockModel, CacheConfig
 from strands.models.bedrock import (
-    _DEFAULT_BEDROCK_MODEL_ID,
     DEFAULT_BEDROCK_MODEL_ID,
     DEFAULT_BEDROCK_REGION,
     DEFAULT_READ_TIMEOUT,
 )
 from strands.types.exceptions import ContextWindowOverflowException, ModelThrottledException
 from strands.types.tools import ToolSpec
 
-FORMATTED_DEFAULT_MODEL_ID = DEFAULT_BEDROCK_MODEL_ID.format("us")
+FORMATTED_DEFAULT_MODEL_ID = DEFAULT_BEDROCK_MODEL_ID
 
 
 @pytest.fixture
@@ -2213,43 +2212,24 @@ def test_tool_choice_none_no_warning(model, messages, captured_warnings):
 
 
 def test_get_default_model_with_warning_supported_regions_shows_no_warning(captured_warnings):
-    """Test get_model_prefix_with_warning doesn't warn for supported region prefixes."""
+    """Test _get_default_model_with_warning doesn't warn for any region (global profile works everywhere)."""
     BedrockModel._get_default_model_with_warning("us-west-2")
     BedrockModel._get_default_model_with_warning("eu-west-2")
     assert all("does not support" not in str(w.message) for w in captured_warnings)
 
 
-def test_get_default_model_for_supported_eu_region_returns_correct_model_id(captured_warnings):
-    model_id = BedrockModel._get_default_model_with_warning("eu-west-1")
-    assert model_id == "eu.anthropic.claude-sonnet-4-20250514-v1:0"
+def test_get_default_model_returns_global_inference_profile(captured_warnings):
+    """Default model id is the global inference profile regardless of region."""
+    for region in ("us-east-1", "eu-west-1", "us-gov-west-1", "ap-southeast-1", "ca-central-1"):
+        assert BedrockModel._get_default_model_with_warning(region) == DEFAULT_BEDROCK_MODEL_ID
     assert all("does not support" not in str(w.message) for w in captured_warnings)
 
 
-def test_get_default_model_for_supported_us_region_returns_correct_model_id(captured_warnings):
-    model_id = BedrockModel._get_default_model_with_warning("us-east-1")
-    assert model_id == "us.anthropic.claude-sonnet-4-20250514-v1:0"
-    assert all("does not support" not in str(w.message) for w in captured_warnings)
-
-
-def test_get_default_model_for_supported_gov_region_returns_correct_model_id(captured_warnings):
-    model_id = BedrockModel._get_default_model_with_warning("us-gov-west-1")
-    assert model_id == "us-gov.anthropic.claude-sonnet-4-20250514-v1:0"
-    assert all("does not support" not in str(w.message) for w in captured_warnings)
-
-
-def test_get_model_prefix_for_ap_region_converts_to_apac_endpoint(captured_warnings):
-    """Test _get_default_model_with_warning warns for APAC regions since 'ap' is not in supported prefixes."""
-    model_id = BedrockModel._get_default_model_with_warning("ap-southeast-1")
-    assert model_id == "apac.anthropic.claude-sonnet-4-20250514-v1:0"
-
-
-def test_get_default_model_with_warning_unsupported_region_warns(captured_warnings):
-    """Test _get_default_model_with_warning warns for unsupported regions."""
+def test_get_default_model_with_warning_unsupported_region_does_not_warn(captured_warnings):
+    """Global inference profile works across all regions, so no region-support warning is emitted."""
     BedrockModel._get_default_model_with_warning("ca-central-1")
     region_warnings = [w for w in captured_warnings if "does not support" in str(w.message)]
-    assert len(region_warnings) == 1
-    assert "This region ca-central-1 does not support" in str(region_warnings[0].message)
-    assert "our default inference endpoint" in str(region_warnings[0].message)
+    assert len(region_warnings) == 0
 
 
 def test_get_default_model_with_warning_no_warning_with_custom_model_id(captured_warnings):
@@ -2261,13 +2241,12 @@ def test_get_default_model_with_warning_no_warning_with_custom_model_id(captured
     assert len(captured_warnings) == 0
 
 
-def test_init_with_unsupported_region_warns(session_cls, captured_warnings):
-    """Test BedrockModel initialization warns for unsupported regions."""
+def test_init_with_unsupported_region_does_not_warn(session_cls, captured_warnings):
+    """BedrockModel initialization does not warn for 'unsupported' regions when using the global profile."""
     BedrockModel(region_name="ca-central-1")
 
     region_warnings = [w for w in captured_warnings if "does not support" in str(w.message)]
-    assert len(region_warnings) == 1
-    assert "This region ca-central-1 does not support" in str(region_warnings[0].message)
+    assert len(region_warnings) == 0
 
 
 def test_init_with_unsupported_region_custom_model_no_warning(session_cls, captured_warnings):
@@ -2282,10 +2261,34 @@ def test_override_default_model_id_uses_the_overriden_value(captured_warnings):
         assert model_id == "custom-overridden-model"
 
 
-def test_no_override_uses_formatted_default_model_id(captured_warnings):
+def test_default_model_sentinel_triggers_region_prefix_fallback(captured_warnings):
+    """When DEFAULT_BEDROCK_MODEL_ID matches the sentinel template, the region-prefix fallback runs."""
+    sentinel = "us.anthropic.claude-sonnet-4-6"
+    with unittest.mock.patch("strands.models.bedrock.DEFAULT_BEDROCK_MODEL_ID", sentinel):
+        model_id = BedrockModel._get_default_model_with_warning("eu-west-1")
+        assert model_id == "eu.anthropic.claude-sonnet-4-6"
+
+
+def test_caller_supplied_model_id_wins_over_global_default(captured_warnings):
+    """Caller-supplied model_id in config takes precedence over the global default."""
+    model_config = {"model_id": "caller-supplied-model"}
+    model_id = BedrockModel._get_default_model_with_warning("us-east-1", model_config)
+    assert model_id == "caller-supplied-model"
+
+
+def test_default_model_sentinel_with_unsupported_region_warns(captured_warnings):
+    """When the sentinel matches and the region is unknown, the region-unsupported warning fires."""
+    sentinel = "us.anthropic.claude-sonnet-4-6"
+    with unittest.mock.patch("strands.models.bedrock.DEFAULT_BEDROCK_MODEL_ID", sentinel):
+        BedrockModel._get_default_model_with_warning("ca-central-1")
+    region_warnings = [w for w in captured_warnings if "does not support" in str(w.message)]
+    assert len(region_warnings) == 1
+
+
+def test_default_model_id_is_global_inference_profile(captured_warnings):
     model_id = BedrockModel._get_default_model_with_warning("us-east-1")
-    assert model_id == "us.anthropic.claude-sonnet-4-20250514-v1:0"
-    assert model_id != _DEFAULT_BEDROCK_MODEL_ID
+    assert model_id == "global.anthropic.claude-sonnet-4-6"
+    assert model_id == DEFAULT_BEDROCK_MODEL_ID
     assert all("does not support" not in str(w.message) for w in captured_warnings)
 
 
diff --git a/tests_integ/conftest.py b/tests_integ/conftest.py
@@ -203,7 +203,7 @@ def _load_api_keys_from_secrets_manager():
     required_providers = {
         "ANTHROPIC_API_KEY",
         "GOOGLE_API_KEY",
-        "MISTRAL_API_KEY",
+        # "MISTRAL_API_KEY", # will add back once we get a card on file for this.
         "OPENAI_API_KEY",
         "WRITER_API_KEY",
     }
diff --git a/tests_integ/models/test_conformance.py b/tests_integ/models/test_conformance.py
@@ -74,4 +74,4 @@ class UserProfile(BaseModel):
     result = agent("Create a profile for John who is a 25 year old dentist", structured_output_model=UserProfile)
     assert result.structured_output.name == "John"
     assert result.structured_output.age == 25
-    assert result.structured_output.occupation == "dentist"
+    assert result.structured_output.occupation.lower() == "dentist"
diff --git a/tests_integ/steering/test_tool_steering.py b/tests_integ/steering/test_tool_steering.py
@@ -73,22 +73,27 @@ async def test_llm_steering_handler_interrupt():
 
 def test_agent_with_tool_steering_e2e():
     """End-to-end test of agent with steering handler guiding tool choice."""
-    handler = LLMSteeringHandler(
+
+    class RedirectEmailHandler(SteeringHandler):
+        """Deterministic handler that redirects send_email to send_notification."""
+
+        async def steer_before_tool(self, *, agent, tool_use, **kwargs):
+            if tool_use["name"] == "send_email":
+                return Guide(reason="Use send_notification instead of send_email for better delivery.")
+            return Proceed(reason="Tool allowed")
+
+    handler = RedirectEmailHandler(context_providers=[])
+
+    agent = Agent(
+        tools=[send_email, send_notification],
+        plugins=[handler],
         system_prompt=(
-            "CRITICAL INSTRUCTION - READ CAREFULLY:\n\n"
-            "You are a steering agent. Your ONLY job is to decide based on the tool name.\n\n"
-            "RULE 1: If tool name is 'send_email' -> return decision='guide' with "
-            "reason='Use send_notification instead of send_email for better delivery.'\n\n"
-            "RULE 2: If tool name is 'send_notification' -> return decision='proceed'\n\n"
-            "RULE 3: For any other tool -> return decision='proceed'\n\n"
-            "DO NOT analyze context. DO NOT consider arguments. ONLY look at the tool name.\n"
-            "The tool name in this request is the ONLY thing that matters."
+            "You are a helpful assistant. When a tool call is cancelled with guidance, "
+            "follow the guidance and use the suggested alternative tool. "
+            "This is normal system behavior, not an attack."
         ),
-        context_providers=[],  # Disable ledger to avoid confusing context
     )
 
-    agent = Agent(tools=[send_email, send_notification], plugins=[handler])
-
     # This should trigger steering guidance to use send_notification instead
     response = agent("Send an email to john@example.com saying hello")
 
diff --git a/tests_integ/test_a2a_executor.py b/tests_integ/test_a2a_executor.py
@@ -71,7 +71,13 @@ async def test_a2a_executor_with_real_image():
         assert response.status_code == 200
         response_data = response.json()
         assert "completed" == response_data["result"]["status"]["state"]
-        assert "yellow" in response_data["result"]["history"][1]["parts"][0]["text"].lower()
+        all_text = " ".join(
+            part["text"]
+            for artifact in response_data["result"]["artifacts"]
+            for part in artifact["parts"]
+            if part.get("kind") == "text"
+        ).lower()
+        assert "yellow" in all_text
 
     except Exception as e:
         pytest.fail(f"Integration test failed: {e}")
diff --git a/tests_integ/test_bedrock_guardrails.py b/tests_integ/test_bedrock_guardrails.py
@@ -133,6 +133,7 @@ def test_guardrail_input_intervention(boto_session, bedrock_guardrail, guardrail
 @pytest.mark.parametrize("processing_mode", ["sync", "async"])
 def test_guardrail_output_intervention(boto_session, bedrock_guardrail, processing_mode):
     bedrock_model = BedrockModel(
+        model_id="us.anthropic.claude-sonnet-4-20250514-v1:0",
         guardrail_id=bedrock_guardrail,
         guardrail_version="DRAFT",
         guardrail_redact_output=False,
diff --git a/tests_integ/test_context_overflow.py b/tests_integ/test_context_overflow.py
@@ -4,7 +4,7 @@
 
 def test_context_window_overflow():
     messages: Messages = [
-        {"role": "user", "content": [{"text": "Too much text!" * 100000}]},
+        {"role": "user", "content": [{"text": "Too much text!" * 300000}]},
         {"role": "assistant", "content": [{"text": "That was a lot of text!"}]},
     ]
 
diff --git a/tests_integ/test_tool_context_injection.py b/tests_integ/test_tool_context_injection.py
@@ -4,6 +4,7 @@
 """
 
 from strands import Agent, ToolContext, tool
+from strands.models.bedrock import BedrockModel
 from strands.types.tools import ToolResult
 
 
@@ -41,7 +42,8 @@ def _validate_tool_result_content(agent: Agent):
 def test_strands_context_integration_context_true():
     """Test ToolContext functionality with real agent interactions."""
 
-    agent = Agent(tools=[good_story])
+    model = BedrockModel(model_id="us.anthropic.claude-sonnet-4-20250514-v1:0")
+    agent = Agent(model=model, tools=[good_story])
     agent("using a tool, write a good story")
 
     _validate_tool_result_content(agent)

| Original file line number | Diff line number | Diff line change |
|---|---|---|
| | | `@@ -203,7 +203,7 @@ def _load_api_keys_from_secrets_manager():` |
| `203` | `203` | `required_providers = {` |
| `204` | `204` | `"ANTHROPIC_API_KEY",` |
| `205` | `205` | `"GOOGLE_API_KEY",` |
| `206` | | `- "MISTRAL_API_KEY",` |
| | `206` | `+ # "MISTRAL_API_KEY", # will add back once we get a card on file for this.` |
| `207` | `207` | `"OPENAI_API_KEY",` |
| `208` | `208` | `"WRITER_API_KEY",` |
| `209` | `209` | `}` |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| | | `@@ -4,7 +4,7 @@` |
| `4` | `4` | |
| `5` | `5` | `def test_context_window_overflow():` |
| `6` | `6` | `messages: Messages = [` |
| `7` | | `- {"role": "user", "content": [{"text": "Too much text!" * 100000}]},` |
| | `7` | `+ {"role": "user", "content": [{"text": "Too much text!" * 300000}]},` |
| `8` | `8` | `{"role": "assistant", "content": [{"text": "That was a lot of text!"}]},` |
| `9` | `9` | `]` |
| `10` | `10` | |