fix: Generate IDs for FunctionCalls when processing streaming LLM responses

xuanyang15 · copybara-github · commit fe4181718d10 · 2026-03-26T18:05:46.000-07:00
Close: #4609 Co-authored-by: Xuan Yang <xygoogle@google.com> PiperOrigin-RevId: 890144644
diff --git a/src/google/adk/utils/streaming_utils.py b/src/google/adk/utils/streaming_utils.py
@@ -225,6 +225,13 @@ def _process_function_call_part(self, part: types.Part) -> None:
     if fc.partial_args or fc.will_continue:
       # Streaming function call arguments
 
+      # Generate ID on first chunk if not provided by LLM
+      if not fc.id and not self._current_fc_id:
+        # Lazy import to avoid circular dependency
+        from ..flows.llm_flows.functions import generate_client_function_call_id
+
+        fc.id = generate_client_function_call_id()
+
       # Save thought_signature from the part (first chunk should have it)
       if part.thought_signature and not self._current_thought_signature:
         self._current_thought_signature = part.thought_signature
@@ -233,6 +240,12 @@ def _process_function_call_part(self, part: types.Part) -> None:
       # Non-streaming function call (standard format with args)
       # Skip empty function calls (used as streaming end markers)
       if fc.name:
+        # Generate ID if not provided by LLM
+        if not fc.id:
+          # Lazy import to avoid circular dependency
+          from ..flows.llm_flows.functions import generate_client_function_call_id
+
+          fc.id = generate_client_function_call_id()
         # Flush any buffered text first, then add the FC part
         self._flush_text_buffer_to_sequence()
         self._parts_sequence.append(part)
diff --git a/tests/unittests/utils/test_streaming_utils.py b/tests/unittests/utils/test_streaming_utils.py
@@ -16,6 +16,7 @@
 
 from google.adk.features._feature_registry import FeatureName
 from google.adk.features._feature_registry import temporary_feature_override
+from google.adk.flows.llm_flows.functions import AF_FUNCTION_CALL_ID_PREFIX
 from google.adk.utils import streaming_utils
 from google.genai import types
 import pytest
@@ -304,3 +305,234 @@ async def run_test():
         await run_test()
     else:
       await run_test()
+
+
+class TestFunctionCallIdGeneration:
+  """Tests for function call ID generation in streaming mode.
+
+  Regression tests for https://github.com/google/adk-python/issues/4609.
+  """
+
+  @pytest.mark.asyncio
+  async def test_non_streaming_fc_generates_id_when_empty(self):
+    """Non-streaming function call should get an adk-* ID if LLM didn't provide one."""
+    with temporary_feature_override(
+        FeatureName.PROGRESSIVE_SSE_STREAMING, True
+    ):
+      aggregator = streaming_utils.StreamingResponseAggregator()
+
+      response = types.GenerateContentResponse(
+          candidates=[
+              types.Candidate(
+                  content=types.Content(
+                      parts=[
+                          types.Part(
+                              function_call=types.FunctionCall(
+                                  name="my_tool",
+                                  args={"x": 1},
+                                  id=None,  # No ID from LLM
+                              )
+                          )
+                      ]
+                  ),
+                  finish_reason=types.FinishReason.STOP,
+              )
+          ]
+      )
+
+      async for _ in aggregator.process_response(response):
+        pass
+
+      closed_response = aggregator.close()
+      assert closed_response is not None
+      fc = closed_response.content.parts[0].function_call
+      assert fc.id is not None
+      assert fc.id.startswith(AF_FUNCTION_CALL_ID_PREFIX)
+
+  @pytest.mark.asyncio
+  async def test_non_streaming_fc_preserves_llm_assigned_id(self):
+    """Non-streaming function call should preserve ID if LLM provided one."""
+    with temporary_feature_override(
+        FeatureName.PROGRESSIVE_SSE_STREAMING, True
+    ):
+      aggregator = streaming_utils.StreamingResponseAggregator()
+
+      response = types.GenerateContentResponse(
+          candidates=[
+              types.Candidate(
+                  content=types.Content(
+                      parts=[
+                          types.Part(
+                              function_call=types.FunctionCall(
+                                  name="my_tool",
+                                  args={"x": 1},
+                                  id="llm-assigned-id",
+                              )
+                          )
+                      ]
+                  ),
+                  finish_reason=types.FinishReason.STOP,
+              )
+          ]
+      )
+
+      async for _ in aggregator.process_response(response):
+        pass
+
+      closed_response = aggregator.close()
+      assert closed_response is not None
+      fc = closed_response.content.parts[0].function_call
+      assert fc.id == "llm-assigned-id"
+
+  @pytest.mark.asyncio
+  async def test_streaming_fc_generates_consistent_id_across_chunks(self):
+    """Streaming function call should have the same ID in partial and final responses."""
+    with temporary_feature_override(
+        FeatureName.PROGRESSIVE_SSE_STREAMING, True
+    ):
+      aggregator = streaming_utils.StreamingResponseAggregator()
+
+      # First chunk: function call starts
+      response1 = types.GenerateContentResponse(
+          candidates=[
+              types.Candidate(
+                  content=types.Content(
+                      parts=[
+                          types.Part(
+                              function_call=types.FunctionCall(
+                                  name="my_tool",
+                                  id=None,
+                                  partial_args=[
+                                      types.PartialArg(
+                                          json_path="$.x",
+                                          string_value="hello",
+                                      )
+                                  ],
+                                  will_continue=True,
+                              )
+                          )
+                      ]
+                  )
+              )
+          ]
+      )
+
+      # Second chunk: function call continues
+      response2 = types.GenerateContentResponse(
+          candidates=[
+              types.Candidate(
+                  content=types.Content(
+                      parts=[
+                          types.Part(
+                              function_call=types.FunctionCall(
+                                  name=None,
+                                  id=None,
+                                  partial_args=[
+                                      types.PartialArg(
+                                          json_path="$.x",
+                                          string_value=" world",
+                                      )
+                                  ],
+                                  will_continue=False,  # Complete
+                              )
+                          )
+                      ]
+                  ),
+                  finish_reason=types.FinishReason.STOP,
+              )
+          ]
+      )
+
+      partial_results = []
+      async for r in aggregator.process_response(response1):
+        partial_results.append(r)
+      async for r in aggregator.process_response(response2):
+        partial_results.append(r)
+
+      closed_response = aggregator.close()
+      assert closed_response is not None
+      final_fc = closed_response.content.parts[0].function_call
+      assert final_fc.id is not None
+      assert final_fc.id.startswith(AF_FUNCTION_CALL_ID_PREFIX)
+      assert final_fc.args == {"x": "hello world"}
+
+      # Verify partial and final events share the same ID
+      partial_fc = partial_results[0].content.parts[0].function_call
+      assert (
+          partial_fc.id == final_fc.id
+      ), f"Partial FC ID ({partial_fc.id!r}) != Final FC ID ({final_fc.id!r})"
+
+  @pytest.mark.asyncio
+  async def test_multiple_streaming_fcs_get_different_ids(self):
+    """Multiple function calls arriving in separate chunks should get different IDs."""
+    with temporary_feature_override(
+        FeatureName.PROGRESSIVE_SSE_STREAMING, True
+    ):
+      aggregator = streaming_utils.StreamingResponseAggregator()
+
+      # First FC
+      response1 = types.GenerateContentResponse(
+          candidates=[
+              types.Candidate(
+                  content=types.Content(
+                      parts=[
+                          types.Part(
+                              function_call=types.FunctionCall(
+                                  name="tool_a",
+                                  id=None,
+                                  partial_args=[
+                                      types.PartialArg(
+                                          json_path="$.a", string_value="val_a"
+                                      )
+                                  ],
+                                  will_continue=False,
+                              )
+                          )
+                      ]
+                  )
+              )
+          ]
+      )
+
+      # Second FC
+      response2 = types.GenerateContentResponse(
+          candidates=[
+              types.Candidate(
+                  content=types.Content(
+                      parts=[
+                          types.Part(
+                              function_call=types.FunctionCall(
+                                  name="tool_b",
+                                  id=None,
+                                  partial_args=[
+                                      types.PartialArg(
+                                          json_path="$.b", string_value="val_b"
+                                      )
+                                  ],
+                                  will_continue=False,
+                              )
+                          )
+                      ]
+                  ),
+                  finish_reason=types.FinishReason.STOP,
+              )
+          ]
+      )
+
+      async for _ in aggregator.process_response(response1):
+        pass
+      async for _ in aggregator.process_response(response2):
+        pass
+
+      closed_response = aggregator.close()
+      assert closed_response is not None
+      assert len(closed_response.content.parts) == 2
+
+      fc_a = closed_response.content.parts[0].function_call
+      fc_b = closed_response.content.parts[1].function_call
+
+      assert fc_a.id is not None
+      assert fc_b.id is not None
+      assert fc_a.id.startswith(AF_FUNCTION_CALL_ID_PREFIX)
+      assert fc_b.id.startswith(AF_FUNCTION_CALL_ID_PREFIX)
+      assert fc_a.id != fc_b.id  # Different IDs for different FCs