fix: forward temperature, top_p, top_k and stop_sequences from the request config to the Anthropic client

sebastienc · sebastienc · commit 2b72e5f41653 · 2026-04-27T20:49:41.000-04:00
diff --git a/src/google/adk/models/anthropic_llm.py b/src/google/adk/models/anthropic_llm.py
@@ -493,15 +493,20 @@ async def generate_content_async(
     )
     thinking = _build_anthropic_thinking_param(llm_request.config)
 
+    config = llm_request.config
     if not stream:
       message = await self._anthropic_client.messages.create(
           model=model_to_use,
-          system=llm_request.config.system_instruction,
+          system=config.system_instruction,
           messages=messages,
           tools=tools,
           tool_choice=tool_choice,
           max_tokens=self.max_tokens,
           thinking=thinking,
+          temperature=config.temperature if config.temperature is not None else NOT_GIVEN,
+          top_p=config.top_p if config.top_p is not None else NOT_GIVEN,
+          top_k=config.top_k if config.top_k is not None else NOT_GIVEN,
+          stop_sequences=config.stop_sequences if config.stop_sequences is not None else NOT_GIVEN,
       )
       yield message_to_generate_content_response(message)
     else:
@@ -528,13 +533,18 @@ async def _generate_content_streaming(
     a final aggregated LlmResponse with all content.
     """
     model_to_use = self._resolve_model_name(llm_request.model)
+    config = llm_request.config
     raw_stream = await self._anthropic_client.messages.create(
         model=model_to_use,
-        system=llm_request.config.system_instruction,
+        system=config.system_instruction,
         messages=messages,
         tools=tools,
         tool_choice=tool_choice,
         max_tokens=self.max_tokens,
+        temperature=config.temperature if config.temperature is not None else NOT_GIVEN,
+        top_p=config.top_p if config.top_p is not None else NOT_GIVEN,
+        top_k=config.top_k if config.top_k is not None else NOT_GIVEN,
+        stop_sequences=config.stop_sequences if config.stop_sequences is not None else NOT_GIVEN,
         stream=True,
         thinking=thinking,
     )
diff --git a/tests/unittests/models/test_anthropic_llm.py b/tests/unittests/models/test_anthropic_llm.py
@@ -1905,3 +1905,185 @@ async def test_streaming_redacted_thinking_block_preserved_in_final():
 
   text_part = final.content.parts[1]
   assert text_part.text == "Done."
+
+
+
+
+# --- Tests for generation config parameter forwarding ---
+
+
+def _make_minimal_stream(text="Hi"):
+  """Build the shortest event list that streams one text block.
+
+  The single content_block_delta carries `text`; the other events only
+  frame it (message/block start and stop, plus an "end_turn" delta).
+  """
+  start_usage = MagicMock(input_tokens=5, output_tokens=0)
+  end_usage = MagicMock(output_tokens=1)
+  empty_block = anthropic_types.TextBlock(text="", type="text")
+  text_delta = anthropic_types.TextDelta(text=text, type="text_delta")
+  end_delta = MagicMock(stop_reason="end_turn")
+  events = []
+  events.append(
+      MagicMock(type="message_start", message=MagicMock(usage=start_usage))
+  )
+  events.append(
+      MagicMock(type="content_block_start", index=0, content_block=empty_block)
+  )
+  events.append(MagicMock(type="content_block_delta", index=0, delta=text_delta))
+  events.append(MagicMock(type="content_block_stop", index=0))
+  events.append(
+      MagicMock(type="message_delta", delta=end_delta, usage=end_usage)
+  )
+  events.append(MagicMock(type="message_stop"))
+  return events
+
+
+@pytest.mark.asyncio
+async def test_non_streaming_forwards_generation_params():
+  """temperature, top_p, top_k, stop_sequences forwarded to messages.create."""
+  llm = AnthropicLlm(model="claude-sonnet-4-20250514")
+  mock_message = anthropic_types.Message(
+      id="msg_test",
+      content=[anthropic_types.TextBlock(text="Hi", type="text", citations=None)],
+      model="claude-sonnet-4-20250514",
+      role="assistant",
+      stop_reason="end_turn",
+      stop_sequence=None,
+      type="message",
+      usage=anthropic_types.Usage(
+          input_tokens=5,
+          output_tokens=2,
+          cache_creation_input_tokens=0,
+          cache_read_input_tokens=0,
+          server_tool_use=None,
+          service_tier=None,
+      ),
+  )
+  mock_client = MagicMock()
+  mock_client.messages.create = AsyncMock(return_value=mock_message)
+
+  llm_request = LlmRequest(
+      model="claude-sonnet-4-20250514",
+      contents=[Content(role="user", parts=[Part.from_text(text="Hi")])],
+      config=types.GenerateContentConfig(
+          system_instruction="Test",
+          temperature=0.7,
+          top_p=0.9,
+          top_k=40,
+          stop_sequences=["STOP", "END"],
+      ),
+  )
+
+  with mock.patch.object(llm, "_anthropic_client", mock_client):
+    _ = [r async for r in llm.generate_content_async(llm_request, stream=False)]
+
+  # Each sampling parameter set on the config must reach the SDK call as-is.
+  mock_client.messages.create.assert_awaited_once()
+  _, kwargs = mock_client.messages.create.call_args
+  assert kwargs["temperature"] == 0.7
+  assert kwargs["top_p"] == 0.9
+  assert kwargs["top_k"] == 40
+  assert kwargs["stop_sequences"] == ["STOP", "END"]
+
+
+@pytest.mark.asyncio
+async def test_non_streaming_omits_unset_generation_params():
+  """A config without sampling params sends NOT_GIVEN (never None) for each."""
+  from anthropic import NOT_GIVEN
+
+  llm = AnthropicLlm(model="claude-sonnet-4-20250514")
+  usage = anthropic_types.Usage(
+      input_tokens=5,
+      output_tokens=2,
+      cache_creation_input_tokens=0,
+      cache_read_input_tokens=0,
+      server_tool_use=None,
+      service_tier=None,
+  )
+  reply = anthropic_types.Message(
+      id="msg_test",
+      content=[anthropic_types.TextBlock(text="Hi", type="text", citations=None)],
+      model="claude-sonnet-4-20250514",
+      role="assistant",
+      stop_reason="end_turn",
+      stop_sequence=None,
+      type="message",
+      usage=usage,
+  )
+  fake_client = MagicMock()
+  fake_client.messages.create = AsyncMock(return_value=reply)
+  bare_config = types.GenerateContentConfig(system_instruction="Test")
+  request = LlmRequest(
+      model="claude-sonnet-4-20250514",
+      contents=[Content(role="user", parts=[Part.from_text(text="Hi")])],
+      config=bare_config,
+  )
+
+  with mock.patch.object(llm, "_anthropic_client", fake_client):
+    async for _ in llm.generate_content_async(request, stream=False):
+      pass
+
+  sent = fake_client.messages.create.call_args.kwargs
+  for name in ("temperature", "top_p", "top_k", "stop_sequences"):
+    assert sent[name] is NOT_GIVEN
+
+
+@pytest.mark.asyncio
+async def test_streaming_forwards_generation_params():
+  """temperature, top_p, top_k, stop_sequences forwarded in streaming path."""
+  llm = AnthropicLlm(model="claude-sonnet-4-20250514")
+  mock_client = MagicMock()
+  mock_client.messages.create = AsyncMock(
+      return_value=_make_mock_stream_events(_make_minimal_stream())
+  )
+
+  llm_request = LlmRequest(
+      model="claude-sonnet-4-20250514",
+      contents=[Content(role="user", parts=[Part.from_text(text="Hi")])],
+      config=types.GenerateContentConfig(
+          system_instruction="Test",
+          temperature=0.5,
+          top_p=0.8,
+          top_k=20,
+          stop_sequences=["DONE"],
+      ),
+  )
+
+  with mock.patch.object(llm, "_anthropic_client", mock_client):
+    _ = [r async for r in llm.generate_content_async(llm_request, stream=True)]
+
+  # stream=True proves these kwargs came from the streaming code path.
+  _, kwargs = mock_client.messages.create.call_args
+  assert kwargs["stream"] is True
+  assert kwargs["temperature"] == 0.5
+  assert kwargs["top_p"] == 0.8
+  assert kwargs["top_k"] == 20
+  assert kwargs["stop_sequences"] == ["DONE"]
+
+
+@pytest.mark.asyncio
+async def test_streaming_omits_unset_generation_params():
+  """Streaming path sends NOT_GIVEN for every sampling param left unset."""
+  from anthropic import NOT_GIVEN
+
+  llm = AnthropicLlm(model="claude-sonnet-4-20250514")
+  events = _make_mock_stream_events(_make_minimal_stream())
+  fake_client = MagicMock()
+  fake_client.messages.create = AsyncMock(return_value=events)
+  bare_config = types.GenerateContentConfig(system_instruction="Test")
+  request = LlmRequest(
+      model="claude-sonnet-4-20250514",
+      contents=[Content(role="user", parts=[Part.from_text(text="Hi")])],
+      config=bare_config,
+  )
+
+  # Drain the generator so the mocked stream is fully consumed.
+  with mock.patch.object(llm, "_anthropic_client", fake_client):
+    async for _ in llm.generate_content_async(request, stream=True):
+      pass
+
+  sent = fake_client.messages.create.call_args.kwargs
+  unset = ("temperature", "top_p", "top_k", "stop_sequences")
+  for name in unset:
+    assert sent[name] is NOT_GIVEN