Skip to content

Commit aec50b9

Browse files
committed
fix: address comments
1 parent 8880313 commit aec50b9

2 files changed

Lines changed: 32 additions & 3 deletions

File tree

src/strands/models/bedrock.py

Lines changed: 6 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -124,9 +124,12 @@ class OpenAIEndpointConfig(TypedDict, total=False):
124124
OpenAI-compatible surface, such as the Responses API's server-side stateful conversations
125125
and reasoning controls.
126126
127-
Generic inference parameters (``temperature``, ``top_p``, ``max_tokens``,
128-
``stop_sequences``, ``streaming``) continue to live on :class:`BedrockModel.BedrockConfig`
129-
and are forwarded to the underlying OpenAI model.
127+
Generic inference parameters (``temperature``, ``top_p``, ``max_tokens``) live on
128+
:class:`BedrockModel.BedrockConfig` and are forwarded to the underlying OpenAI model.
129+
``stop_sequences`` is forwarded to Chat Completions as ``stop`` but is rejected at
130+
init time when ``api="responses"`` (the Responses API does not accept stop sequences).
131+
``streaming=False`` is not supported on this path and is also rejected at init time,
132+
since the OpenAI SDK's Responses and Chat Completions surfaces always stream.
130133
131134
Attributes:
132135
api: Which OpenAI API surface to use. ``"responses"`` maps to the Responses API and

tests/strands/models/test_bedrock.py

Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3414,3 +3414,29 @@ def test_openai_endpoint_invalid_config_raises(session_cls, config_kwargs, error
34143414

34153415
with pytest.raises(ValueError, match=error_match):
34163416
BedrockModel(model_id="openai.gpt-oss-120b", region_name="us-east-1", **config_kwargs)
3417+
3418+
3419+
@pytest.mark.asyncio
async def test_openai_endpoint_count_tokens_falls_back_to_base(session_cls, openai_responses_model_cls, messages):
    """count_tokens bypasses the Converse client on the openai_endpoint path.

    Bedrock's native CountTokens API lives on ``bedrock-runtime`` and has no Mantle
    equivalent, so ``BedrockModel.count_tokens`` must route to the base ``Model.count_tokens``
    estimator (tiktoken or heuristic). A regression that routed through ``self.client`` would
    raise ``AttributeError`` since ``self.client is None`` on the Mantle path.
    """
    # Fixture is only needed for its patching side effect, not referenced directly.
    _ = session_cls

    openai_model = BedrockModel(
        model_id="openai.gpt-oss-120b",
        region_name="us-east-1",
        openai_endpoint={"api": "responses"},
    )

    # The delegate is a mock and does not implement count_tokens. The call should still
    # succeed because the override dispatches to super() rather than the delegate or the
    # boto client.
    token_count = await openai_model.count_tokens(messages=messages)

    assert isinstance(token_count, int)
    assert token_count > 0
    openai_responses_model_cls.return_value.count_tokens.assert_not_called()

0 commit comments

Comments (0)