From c41889f7e2ec5b473f3f8bf30aa28bde2d5af220 Mon Sep 17 00:00:00 2001
From: theonlychant <sacehenry@gmail.com>
Date: Tue, 5 May 2026 23:38:55 -0500
Subject: [PATCH 1/3] fix: accumulate text across tool calls for output_key in
 streaming mode

---
 src/google/adk/agents/llm_agent.py | 70 ++++++++++++++++++++++--------
 1 file changed, 52 insertions(+), 18 deletions(-)

diff --git a/src/google/adk/agents/llm_agent.py b/src/google/adk/agents/llm_agent.py
index ed83d00413..9baa38f6d4 100644
--- a/src/google/adk/agents/llm_agent.py
+++ b/src/google/adk/agents/llm_agent.py
@@ -486,7 +486,7 @@ async def _run_async_impl(
     should_pause = False
     async with Aclosing(self._llm_flow.run_async(ctx)) as agen:
       async for event in agen:
-        self.__maybe_save_output_to_state(event)
+        self.__maybe_save_output_to_state(event, ctx)
         yield event
         if ctx.should_pause_invocation(event):
           # Do not pause immediately, wait until the long-running tool call is
@@ -510,7 +510,7 @@ async def _run_live_impl(
   ) -> AsyncGenerator[Event, None]:
     async with Aclosing(self._llm_flow.run_live(ctx)) as agen:
       async for event in agen:
-        self.__maybe_save_output_to_state(event)
+        self.__maybe_save_output_to_state(event, ctx)
         yield event
       if ctx.end_invocation:
         return
@@ -827,8 +827,16 @@ def __get_transfer_to_agent_or_none(
         return self.__get_agent_to_run(event.actions.transfer_to_agent)
     return None
 
-  def __maybe_save_output_to_state(self, event: Event):
-    """Saves the model output to state if needed."""
+  def __maybe_save_output_to_state(
+      self, event: Event, ctx: Optional[InvocationContext] = None
+  ):
+    """Saves the model output to state if needed.
+
+    Backwards-compatible: if `ctx` is None, keeps the original behavior of
+    saving only on final responses. If `ctx` is provided, non-final text is
+    appended to the value already stored in session state under
+    `output_key`, so fragments streamed before a tool call are not lost.
+    """
     # skip if the event was authored by some other agent (e.g. current agent
     # transferred to another agent)
     if event.author != self.name:
@@ -842,28 +850,54 @@ def __maybe_save_output_to_state(self, event: Event):
     if not self.output_key:
       return
 
-    # Handle text responses
-    if event.is_final_response() and event.content and event.content.parts:
+    # Collect text parts from this event
+    if not (event.content and event.content.parts):
+      return
 
-      result = ''.join(
-          part.text
-          for part in event.content.parts
-          if part.text and not part.thought
-      )
+    result = ''.join(
+        part.text for part in event.content.parts if part.text and not part.thought
+    )
+
+    # If no invocation context was provided, preserve legacy behavior: only
+    # save on final responses and apply schema validation then.
+    if ctx is None:
+      if not event.is_final_response():
+        return
       if self.output_schema:
-        # If the result from the final chunk is just whitespace or empty,
-        # it means this is an empty final chunk of a stream.
-        # Do not attempt to parse it as JSON.
         if not result.strip():
           return
         result = validate_schema(self.output_schema, result)
       elif not result:
-        # No text parts found and no output_schema. Skip to avoid
-        # overwriting state_delta values already set by callbacks
-        # (e.g. after_tool_callback with skip_summarization on
-        # function_response-only events).
         return
       event.actions.state_delta[self.output_key] = result
+      return
+
+    # When ctx is provided, append partial streamed results into session
+    # state so earlier streamed text is preserved across tool calls.
+    # Read the existing value from the session (may be empty).
+    try:
+      previous = ctx.session.state.get(self.output_key, '') or ''
+    except Exception:
+      previous = ''
+
+    # Final response: perform schema validation if needed and replace
+    # previous aggregated value with the validated final result.
+    if event.is_final_response():
+      if self.output_schema:
+        if not result.strip():
+          return
+        validated = validate_schema(self.output_schema, result)
+        event.actions.state_delta[self.output_key] = validated
+        return
+      elif not result:
+        return
+      event.actions.state_delta[self.output_key] = result
+      return
+
+    # Non-final (streaming) response: append the fragment to previous value.
+    if result:
+      event.actions.state_delta[self.output_key] = previous + result
+    return
 
   @model_validator(mode='after')
   def __model_validator_after(self) -> LlmAgent:

From c9c8703dd1bb138ba1c92260c88a7d930b1b5000 Mon Sep 17 00:00:00 2001
From: theonlychant <sacehenry@gmail.com>
Date: Wed, 6 May 2026 03:11:40 -0500
Subject: [PATCH 2/3] fix: accumulate all streamed text for output_key across
 tool calls

---
 src/google/adk/agents/llm_agent.py | 17 ++++++++++-------
 1 file changed, 10 insertions(+), 7 deletions(-)

diff --git a/src/google/adk/agents/llm_agent.py b/src/google/adk/agents/llm_agent.py
index 9baa38f6d4..89922c1424 100644
--- a/src/google/adk/agents/llm_agent.py
+++ b/src/google/adk/agents/llm_agent.py
@@ -880,18 +880,21 @@ def __maybe_save_output_to_state(
     except Exception:
       previous = ''
 
-    # Final response: perform schema validation if needed and replace
-    # previous aggregated value with the validated final result.
+    # Final response: combine previous aggregated value with the final
+    # fragment, then perform schema validation if needed and save the
+    # combined result.
     if event.is_final_response():
+      combined = (previous or '') + (result or '')
+      if not combined:
+        return
       if self.output_schema:
-        if not result.strip():
+        # If combined is just whitespace, skip.
+        if not combined.strip():
           return
-        validated = validate_schema(self.output_schema, result)
+        validated = validate_schema(self.output_schema, combined)
         event.actions.state_delta[self.output_key] = validated
         return
-      elif not result:
-        return
-      event.actions.state_delta[self.output_key] = result
+      event.actions.state_delta[self.output_key] = combined
       return
 
     # Non-final (streaming) response: append the fragment to previous value.

From fabd5fe11c3164dd2f160ea26ee705f3d8e17b29 Mon Sep 17 00:00:00 2001
From: theonlychant <sacehenry@gmail.com>
Date: Wed, 6 May 2026 20:28:08 -0500
Subject: [PATCH 3/3] fix(agent): add accumulate_output_key option for output
 aggregation

---
 src/google/adk/agents/llm_agent.py            | 38 ++++++++++++--
 src/google/adk/agents/llm_agent_config.py     |  5 ++
 .../agents/test_llm_agent_output_save.py      | 50 +++++++++++++++++++
 3 files changed, 88 insertions(+), 5 deletions(-)

diff --git a/src/google/adk/agents/llm_agent.py b/src/google/adk/agents/llm_agent.py
index 89922c1424..23745e8d4c 100644
--- a/src/google/adk/agents/llm_agent.py
+++ b/src/google/adk/agents/llm_agent.py
@@ -350,6 +350,14 @@ class LlmAgent(BaseAgent):
   - Extracts agent reply for later use, such as in tools, callbacks, etc.
   - Connects agents to coordinate with each other.
   """
+  accumulate_output_key: bool = True
+  """Whether to accumulate streamed output fragments into `output_key`.
+
+  When True (default) streamed fragments received before tool calls are
+  appended into the session state under `output_key` so the final saved value
+  includes all streamed text. When False, preserves legacy behavior where
+  only the final response's text from the last event is saved.
+  """
   # Controlled input/output configurations - End
 
   # Advance features - Start
@@ -873,22 +881,40 @@ def __maybe_save_output_to_state(
       return
 
     # When ctx is provided, append partial streamed results into session
-    # state so earlier streamed text is preserved across tool calls.
+    # state so earlier streamed text is preserved across tool calls. If the
+    # caller disabled accumulation via `accumulate_output_key`, fall back to
+    # legacy behavior: ignore non-final fragments and save only the final
+    # fragment (without combining previous fragments).
     # Read the existing value from the session (may be empty).
     try:
       previous = ctx.session.state.get(self.output_key, '') or ''
     except Exception:
       previous = ''
+    # If accumulation is disabled, ignore non-final fragments and save only
+    # the final fragment (legacy behavior).
+    if not self.accumulate_output_key:
+      if not event.is_final_response():
+        return
+      # Final-only behavior: validate only the final fragment.
+      if self.output_schema:
+        if not result.strip():
+          return
+        validated = validate_schema(self.output_schema, result)
+        event.actions.state_delta[self.output_key] = validated
+        return
+      if not result:
+        return
+      event.actions.state_delta[self.output_key] = result
+      return
 
-    # Final response: combine previous aggregated value with the final
-    # fragment, then perform schema validation if needed and save the
-    # combined result.
+    # Accumulation enabled: a final response is combined with the previously
+    # stored value, then validated and saved. Non-final events append their
+    # fragment to the stored value so it is available at finalization.
     if event.is_final_response():
       combined = (previous or '') + (result or '')
       if not combined:
         return
       if self.output_schema:
-        # If combined is just whitespace, skip.
         if not combined.strip():
           return
         validated = validate_schema(self.output_schema, combined)
@@ -1032,6 +1058,8 @@ def _parse_config(
       kwargs['output_schema'] = resolve_code_reference(config.output_schema)
     if config.output_key:
       kwargs['output_key'] = config.output_key
+    if getattr(config, 'accumulate_output_key', None) is not None:
+      kwargs['accumulate_output_key'] = config.accumulate_output_key
     if config.tools:
       kwargs['tools'] = cls._resolve_tools(config.tools, config_abs_path)
     if config.before_model_callbacks:
diff --git a/src/google/adk/agents/llm_agent_config.py b/src/google/adk/agents/llm_agent_config.py
index 93ca718094..e8d248b42b 100644
--- a/src/google/adk/agents/llm_agent_config.py
+++ b/src/google/adk/agents/llm_agent_config.py
@@ -139,6 +139,11 @@ def _validate_model_sources(self) -> LlmAgentConfig:
       default=None, description='Optional. LlmAgent.output_key.'
   )
 
+  accumulate_output_key: Optional[bool] = Field(
+      default=None,
+      description='Optional. When true, streamed fragments are accumulated into the `output_key` across tool calls. When false, only the final response is saved to `output_key`.',
+  )
+
   include_contents: Literal['default', 'none'] = Field(
       default='default', description='Optional. LlmAgent.include_contents.'
   )
diff --git a/tests/unittests/agents/test_llm_agent_output_save.py b/tests/unittests/agents/test_llm_agent_output_save.py
index ad7b48e3e2..41588525f0 100644
--- a/tests/unittests/agents/test_llm_agent_output_save.py
+++ b/tests/unittests/agents/test_llm_agent_output_save.py
@@ -307,3 +307,53 @@ def test_maybe_save_output_to_state_skips_function_response_only_event(self):
 
     # The callback-set value should be preserved, not overwritten with ""
     assert event.actions.state_delta["result"] == [1, 2, 3]
+
+  def test_accumulate_output_key_toggle(self):
+    """Test that `accumulate_output_key` controls accumulation behavior.
+
+    Simulate two streamed fragments separated by a tool call by manually
+    updating the session state between calls.
+    """
+    class Ctx:
+      pass
+
+    # Prepare a fake invocation context with session.state
+    ctx = Ctx()
+    ctx.session = type('S', (), {'state': {}})()
+
+    # Case 1: accumulation enabled (default)
+    agent = LlmAgent(name="test_agent", output_key="result")
+
+    # First (partial) fragment
+    event1 = create_test_event(
+        author="test_agent", content_text="Intro: ", is_final=False
+    )
+    agent._LlmAgent__maybe_save_output_to_state(event1, ctx)
+    # Simulate the session update the runner would perform
+    ctx.session.state["result"] = event1.actions.state_delta.get("result", "")
+
+    # Final fragment
+    event2 = create_test_event(author="test_agent", content_text="Conclusion", is_final=True)
+    agent._LlmAgent__maybe_save_output_to_state(event2, ctx)
+
+    # With accumulation enabled, final saved value should include both parts
+    assert event2.actions.state_delta["result"] == "Intro: Conclusion"
+
+    # Case 2: accumulation disabled
+    ctx2 = Ctx()
+    ctx2.session = type('S', (), {'state': {}})()
+    agent2 = LlmAgent(name="test_agent", output_key="result", accumulate_output_key=False)
+
+    event1b = create_test_event(
+        author="test_agent", content_text="Intro: ", is_final=False
+    )
+    agent2._LlmAgent__maybe_save_output_to_state(event1b, ctx2)
+    # Simulate runner updating session with the partial (though when disabled
+    # we expect the partial not to be used for final save)
+    ctx2.session.state["result"] = event1b.actions.state_delta.get("result", "")
+
+    event2b = create_test_event(author="test_agent", content_text="Conclusion", is_final=True)
+    agent2._LlmAgent__maybe_save_output_to_state(event2b, ctx2)
+
+    # With accumulation disabled, final saved value should be only final fragment
+    assert event2b.actions.state_delta["result"] == "Conclusion"