@@ -92,6 +92,11 @@ async def wrapped_stream_response(*args: "Any", **kwargs: "Any") -> "Any":
9292 Wrap stream_response to create an AI client span for streaming.
9393 stream_response is an async generator, so we yield events within the span.
9494
95+ Note: We use an explicit try/finally instead of a ``with`` block so that
96+ the span is closed via ``__exit__(*sys.exc_info())`` on every exit path —
97+ normal completion, errors raised by the model, and GeneratorExit when the
98+ consumer abandons the stream (breaks early, network error, etc.).
99+
95100 Note: stream_response is called with positional args unlike get_response
96101 which uses keyword args. The signature is:
97102 stream_response(
@@ -108,17 +113,21 @@ async def wrapped_stream_response(*args: "Any", **kwargs: "Any") -> "Any":
108113 prompt,
109114 )
110115 """
116+ import sys
117+
111118 # Build kwargs dict from positional args for span data capture
112119 span_kwargs = dict (kwargs )
113120 if len (args ) > 0 :
114121 span_kwargs ["system_instructions" ] = args [0 ]
115122 if len (args ) > 1 :
116123 span_kwargs ["input" ] = args [1 ]
117124
118- with ai_client_span (agent , span_kwargs ) as span :
119- span .set_data (SPANDATA .GEN_AI_RESPONSE_STREAMING , True )
125+ span = ai_client_span (agent , span_kwargs )
126+ span .__enter__ ()
127+ span .set_data (SPANDATA .GEN_AI_RESPONSE_STREAMING , True )
120128
121- streaming_response = None
129+ streaming_response = None
130+ try :
122131 async for event in original_stream_response (* args , ** kwargs ):
123132 # Capture the full response from ResponseCompletedEvent
124133 if hasattr (event , "response" ):
@@ -135,6 +144,8 @@ async def wrapped_stream_response(*args: "Any", **kwargs: "Any") -> "Any":
135144 )
136145 _set_response_model_on_agent_span (agent , response_model )
137146 update_ai_client_span (span , streaming_response )
147+ finally :
148+ span .__exit__ (* sys .exc_info ())
138149
139150 model .stream_response = wrapped_stream_response
140151