From 5cee69e5b78dc5ea370ecc5c7ef9a543aaf343ad Mon Sep 17 00:00:00 2001
From: Alexander Alderman Webb <alexander.webb@sentry.io>
Date: Thu, 26 Feb 2026 11:12:07 +0100
Subject: [PATCH 1/5] ref(openai): Separate output handling

---
 sentry_sdk/integrations/openai.py | 68 +++++++++++++++++++++++++++++--
 1 file changed, 64 insertions(+), 4 deletions(-)

diff --git a/sentry_sdk/integrations/openai.py b/sentry_sdk/integrations/openai.py
index 4f851bf0fb..7381fbec0c 100644
--- a/sentry_sdk/integrations/openai.py
+++ b/sentry_sdk/integrations/openai.py
@@ -462,7 +462,7 @@ def _set_embeddings_input_data(
     _commmon_set_input_data(span, kwargs)
 
 
-def _set_output_data(
+def _common_set_output_data(
     span: "Span",
     response: "Any",
     kwargs: "dict[str, Any]",
@@ -706,11 +706,67 @@ def _new_chat_completion_common(f: "Any", *args: "Any", **kwargs: "Any") -> "Any
     start_time = time.perf_counter()
     response = yield f, args, kwargs
 
-    _set_output_data(span, response, kwargs, integration, start_time, finish_span=True)
+    _set_completions_api_output_data(
+        span, response, kwargs, integration, start_time, finish_span=True
+    )
 
     return response
 
 
+def _set_completions_api_output_data(
+    span: "Span",
+    response: "Any",
+    kwargs: "dict[str, Any]",
+    integration: "OpenAIIntegration",
+    start_time: "Optional[float]" = None,
+    finish_span: bool = True,
+) -> None:
+    _common_set_output_data(
+        span,
+        response,
+        kwargs,
+        integration,
+        start_time,
+        finish_span,
+    )
+
+
+def _set_responses_api_output_data(
+    span: "Span",
+    response: "Any",
+    kwargs: "dict[str, Any]",
+    integration: "OpenAIIntegration",
+    start_time: "Optional[float]" = None,
+    finish_span: bool = True,
+) -> None:
+    _common_set_output_data(
+        span,
+        response,
+        kwargs,
+        integration,
+        start_time,
+        finish_span,
+    )
+
+
+def _set_embeddings_output_data(
+    span: "Span",
+    response: "Any",
+    kwargs: "dict[str, Any]",
+    integration: "OpenAIIntegration",
+    start_time: "Optional[float]" = None,
+    finish_span: bool = True,
+) -> None:
+    _common_set_output_data(
+        span,
+        response,
+        kwargs,
+        integration,
+        start_time,
+        finish_span,
+    )
+
+
 def _wrap_chat_completion_create(f: "Callable[..., Any]") -> "Callable[..., Any]":
     def _execute_sync(f: "Any", *args: "Any", **kwargs: "Any") -> "Any":
         gen = _new_chat_completion_common(f, *args, **kwargs)
@@ -795,7 +851,9 @@ def _new_embeddings_create_common(f: "Any", *args: "Any", **kwargs: "Any") -> "A
 
         response = yield f, args, kwargs
 
-        _set_output_data(span, response, kwargs, integration, finish_span=False)
+        _set_embeddings_output_data(
+            span, response, kwargs, integration, finish_span=False
+        )
 
         return response
 
@@ -885,7 +943,9 @@ def _new_responses_create_common(f: "Any", *args: "Any", **kwargs: "Any") -> "An
     start_time = time.perf_counter()
     response = yield f, args, kwargs
 
-    _set_output_data(span, response, kwargs, integration, start_time, finish_span=True)
+    _set_responses_api_output_data(
+        span, response, kwargs, integration, start_time, finish_span=True
+    )
 
     return response
 

From d94f9535290256161785e9e683a8dbddb28efb0b Mon Sep 17 00:00:00 2001
From: Alexander Alderman Webb <alexander.webb@sentry.io>
Date: Thu, 26 Feb 2026 11:26:37 +0100
Subject: [PATCH 2/5] .

---
 sentry_sdk/integrations/openai.py | 60 +++++++++++++++++++++++++++----
 1 file changed, 54 insertions(+), 6 deletions(-)

diff --git a/sentry_sdk/integrations/openai.py b/sentry_sdk/integrations/openai.py
index 7381fbec0c..8b26f08b4a 100644
--- a/sentry_sdk/integrations/openai.py
+++ b/sentry_sdk/integrations/openai.py
@@ -706,9 +706,15 @@ def _new_chat_completion_common(f: "Any", *args: "Any", **kwargs: "Any") -> "Any
     start_time = time.perf_counter()
     response = yield f, args, kwargs
 
-    _set_completions_api_output_data(
-        span, response, kwargs, integration, start_time, finish_span=True
-    )
+    is_streaming_response = kwargs.get("stream", False)
+    if is_streaming_response:
+        _set_streaming_completions_api_output_data(
+            span, response, kwargs, integration, start_time, finish_span=True
+        )
+    else:
+        _set_completions_api_output_data(
+            span, response, kwargs, integration, start_time, finish_span=True
+        )
 
     return response
 
@@ -731,6 +737,24 @@ def _set_completions_api_output_data(
     )
 
 
+def _set_streaming_completions_api_output_data(
+    span: "Span",
+    response: "Any",
+    kwargs: "dict[str, Any]",
+    integration: "OpenAIIntegration",
+    start_time: "Optional[float]" = None,
+    finish_span: bool = True,
+) -> None:
+    _common_set_output_data(
+        span,
+        response,
+        kwargs,
+        integration,
+        start_time,
+        finish_span,
+    )
+
+
 def _set_responses_api_output_data(
     span: "Span",
     response: "Any",
@@ -749,6 +773,24 @@ def _set_responses_api_output_data(
     )
 
 
+def _set_streaming_responses_api_output_data(
+    span: "Span",
+    response: "Any",
+    kwargs: "dict[str, Any]",
+    integration: "OpenAIIntegration",
+    start_time: "Optional[float]" = None,
+    finish_span: bool = True,
+) -> None:
+    _common_set_output_data(
+        span,
+        response,
+        kwargs,
+        integration,
+        start_time,
+        finish_span,
+    )
+
+
 def _set_embeddings_output_data(
     span: "Span",
     response: "Any",
@@ -943,9 +985,15 @@ def _new_responses_create_common(f: "Any", *args: "Any", **kwargs: "Any") -> "An
     start_time = time.perf_counter()
     response = yield f, args, kwargs
 
-    _set_responses_api_output_data(
-        span, response, kwargs, integration, start_time, finish_span=True
-    )
+    is_streaming_response = kwargs.get("stream", False)
+    if is_streaming_response:
+        _set_responses_api_output_data(
+            span, response, kwargs, integration, start_time, finish_span=True
+        )
+    else:
+        _set_streaming_responses_api_output_data(
+            span, response, kwargs, integration, start_time, finish_span=True
+        )
 
     return response
 

From 4ab8e744c094cd2725520e8fbfcdf2e21fd84b61 Mon Sep 17 00:00:00 2001
From: Alexander Alderman Webb <alexander.webb@sentry.io>
Date: Thu, 26 Feb 2026 11:45:06 +0100
Subject: [PATCH 3/5] ref(openai): Extract input in API-specific functions

---
 sentry_sdk/integrations/openai.py | 46 +++++++++++++++++--------------
 1 file changed, 25 insertions(+), 21 deletions(-)

diff --git a/sentry_sdk/integrations/openai.py b/sentry_sdk/integrations/openai.py
index 8b26f08b4a..6b63e96c0f 100644
--- a/sentry_sdk/integrations/openai.py
+++ b/sentry_sdk/integrations/openai.py
@@ -465,7 +465,7 @@ def _set_embeddings_input_data(
 def _common_set_output_data(
     span: "Span",
     response: "Any",
-    kwargs: "dict[str, Any]",
+    input: "Any",
     integration: "OpenAIIntegration",
     start_time: "Optional[float]" = None,
     finish_span: bool = True,
@@ -473,14 +473,8 @@ def _common_set_output_data(
     if hasattr(response, "model"):
         set_data_normalized(span, SPANDATA.GEN_AI_RESPONSE_MODEL, response.model)
 
-    # Input messages (the prompt or data sent to the model)
-    # used for the token usage calculation
-    messages = kwargs.get("messages")
-    if messages is None:
-        messages = kwargs.get("input")
-
-    if messages is not None and isinstance(messages, str):
-        messages = [messages]
+    if input is not None and isinstance(input, str):
+        input = [input]
 
     ttft: "Optional[float]" = None
 
@@ -494,7 +488,7 @@ def _common_set_output_data(
             if len(response_text) > 0:
                 set_data_normalized(span, SPANDATA.GEN_AI_RESPONSE_TEXT, response_text)
 
-        _calculate_token_usage(messages, response, span, None, integration.count_tokens)
+        _calculate_token_usage(input, response, span, None, integration.count_tokens)
 
         if finish_span:
             span.__exit__(None, None, None)
@@ -530,7 +524,7 @@ def _common_set_output_data(
                     span, SPANDATA.GEN_AI_RESPONSE_TEXT, output_messages["response"]
                 )
 
-        _calculate_token_usage(messages, response, span, None, integration.count_tokens)
+        _calculate_token_usage(input, response, span, None, integration.count_tokens)
 
         if finish_span:
             span.__exit__(None, None, None)
@@ -571,7 +565,7 @@ def new_iterator() -> "Iterator[ChatCompletionChunk]":
                     # OpenAI responses API end of streaming response
                     if RESPONSES_API_ENABLED and isinstance(x, ResponseCompletedEvent):
                         _calculate_token_usage(
-                            messages,
+                            input,
                             x.response,
                             span,
                             None,
@@ -594,7 +588,7 @@ def new_iterator() -> "Iterator[ChatCompletionChunk]":
                         )
                     if count_tokens_manually:
                         _calculate_token_usage(
-                            messages,
+                            input,
                             response,
                             span,
                             all_responses,
@@ -635,7 +629,7 @@ async def new_iterator_async() -> "AsyncIterator[ChatCompletionChunk]":
                     # OpenAI responses API end of streaming response
                     if RESPONSES_API_ENABLED and isinstance(x, ResponseCompletedEvent):
                         _calculate_token_usage(
-                            messages,
+                            input,
                             x.response,
                             span,
                             None,
@@ -658,7 +652,7 @@ async def new_iterator_async() -> "AsyncIterator[ChatCompletionChunk]":
                         )
                     if count_tokens_manually:
                         _calculate_token_usage(
-                            messages,
+                            input,
                             response,
                             span,
                             all_responses,
@@ -672,7 +666,7 @@ async def new_iterator_async() -> "AsyncIterator[ChatCompletionChunk]":
         else:
             response._iterator = new_iterator()
     else:
-        _calculate_token_usage(messages, response, span, None, integration.count_tokens)
+        _calculate_token_usage(input, response, span, None, integration.count_tokens)
         if finish_span:
             span.__exit__(None, None, None)
 
@@ -727,10 +721,12 @@ def _set_completions_api_output_data(
     start_time: "Optional[float]" = None,
     finish_span: bool = True,
 ) -> None:
+    messages = kwargs.get("messages")
+
     _common_set_output_data(
         span,
         response,
-        kwargs,
+        messages,
         integration,
         start_time,
         finish_span,
@@ -745,10 +741,12 @@ def _set_streaming_completions_api_output_data(
     start_time: "Optional[float]" = None,
     finish_span: bool = True,
 ) -> None:
+    messages = kwargs.get("messages")
+
     _common_set_output_data(
         span,
         response,
-        kwargs,
+        messages,
         integration,
         start_time,
         finish_span,
@@ -763,10 +761,12 @@ def _set_responses_api_output_data(
     start_time: "Optional[float]" = None,
     finish_span: bool = True,
 ) -> None:
+    input = kwargs.get("input")
+
     _common_set_output_data(
         span,
         response,
-        kwargs,
+        input,
         integration,
         start_time,
         finish_span,
@@ -781,10 +781,12 @@ def _set_streaming_responses_api_output_data(
     start_time: "Optional[float]" = None,
     finish_span: bool = True,
 ) -> None:
+    input = kwargs.get("input")
+
     _common_set_output_data(
         span,
         response,
-        kwargs,
+        input,
         integration,
         start_time,
         finish_span,
@@ -799,10 +801,12 @@ def _set_embeddings_output_data(
     start_time: "Optional[float]" = None,
     finish_span: bool = True,
 ) -> None:
+    input = kwargs.get("input")
+
     _common_set_output_data(
         span,
         response,
-        kwargs,
+        input,
         integration,
         start_time,
         finish_span,

From fb12a441bc613b88eb758f7e95ab57258eb8e5ef Mon Sep 17 00:00:00 2001
From: Alexander Alderman Webb <alexander.webb@sentry.io>
Date: Thu, 26 Feb 2026 11:53:00 +0100
Subject: [PATCH 4/5] .

---
 sentry_sdk/integrations/openai.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/sentry_sdk/integrations/openai.py b/sentry_sdk/integrations/openai.py
index 8b26f08b4a..fbaf91cee4 100644
--- a/sentry_sdk/integrations/openai.py
+++ b/sentry_sdk/integrations/openai.py
@@ -987,11 +987,11 @@ def _new_responses_create_common(f: "Any", *args: "Any", **kwargs: "Any") -> "An
 
     is_streaming_response = kwargs.get("stream", False)
     if is_streaming_response:
-        _set_responses_api_output_data(
+        _set_streaming_responses_api_output_data(
             span, response, kwargs, integration, start_time, finish_span=True
         )
     else:
-        _set_streaming_responses_api_output_data(
+        _set_responses_api_output_data(
             span, response, kwargs, integration, start_time, finish_span=True
         )
 

From 4f84f98cc4486e64c5118fd9066ddc8adab3617b Mon Sep 17 00:00:00 2001
From: Alexander Alderman Webb <alexander.webb@sentry.io>
Date: Thu, 26 Feb 2026 12:07:10 +0100
Subject: [PATCH 5/5] .

---
 sentry_sdk/integrations/openai.py | 18 +++++++++++++++---
 1 file changed, 15 insertions(+), 3 deletions(-)

diff --git a/sentry_sdk/integrations/openai.py b/sentry_sdk/integrations/openai.py
index 0308adda94..d8139f217b 100644
--- a/sentry_sdk/integrations/openai.py
+++ b/sentry_sdk/integrations/openai.py
@@ -473,9 +473,6 @@ def _common_set_output_data(
     if hasattr(response, "model"):
         set_data_normalized(span, SPANDATA.GEN_AI_RESPONSE_MODEL, response.model)
 
-    if input is not None and isinstance(input, str):
-        input = [input]
-
     ttft: "Optional[float]" = None
 
     if hasattr(response, "choices"):
@@ -723,6 +720,9 @@ def _set_completions_api_output_data(
 ) -> None:
     messages = kwargs.get("messages")
 
+    if messages is not None and isinstance(messages, str):
+        messages = [messages]
+
     _common_set_output_data(
         span,
         response,
@@ -743,6 +743,9 @@ def _set_streaming_completions_api_output_data(
 ) -> None:
     messages = kwargs.get("messages")
 
+    if messages is not None and isinstance(messages, str):
+        messages = [messages]
+
     _common_set_output_data(
         span,
         response,
@@ -763,6 +766,9 @@ def _set_responses_api_output_data(
 ) -> None:
     input = kwargs.get("input")
 
+    if input is not None and isinstance(input, str):
+        input = [input]
+
     _common_set_output_data(
         span,
         response,
@@ -783,6 +789,9 @@ def _set_streaming_responses_api_output_data(
 ) -> None:
     input = kwargs.get("input")
 
+    if input is not None and isinstance(input, str):
+        input = [input]
+
     _common_set_output_data(
         span,
         response,
@@ -803,6 +812,9 @@ def _set_embeddings_output_data(
 ) -> None:
     input = kwargs.get("input")
 
+    if input is not None and isinstance(input, str):
+        input = [input]
+
     _common_set_output_data(
         span,
         response,