clarify

shellmayr · shellmayr · commit dadbc7957c1d · 2026-03-05T11:08:20.000+01:00
diff --git a/sentry_sdk/ai/span_config.py b/sentry_sdk/ai/span_config.py
@@ -1,7 +1,10 @@
 import sentry_sdk
 from sentry_sdk.consts import SPANDATA
+from sentry_sdk.ai.monitoring import record_token_usage
 from sentry_sdk.ai.utils import (
+    get_first_from_sources,
     set_data_normalized,
+    set_span_data_from_sources,
     normalize_message_roles,
     truncate_and_annotate_messages,
 )
@@ -10,11 +13,11 @@
 from typing import TYPE_CHECKING
 
 if TYPE_CHECKING:
-    from typing import Any, Dict
+    from typing import Any, Dict, List, Optional
     from sentry_sdk.tracing import Span
 
 
-def set_input_span_data(span, kwargs, integration, config, span_data=None):
+def set_request_span_data(span, kwargs, integration, config, span_data=None):
     # type: (Span, Dict[str, Any], Any, Dict[str, Any], Dict[str, Any] | None) -> None
     """
     Set input span data from a declarative config.
@@ -57,3 +60,49 @@ def set_input_span_data(span, kwargs, integration, config, span_data=None):
             if kwarg_key in kwargs:
                 value = kwargs[kwarg_key]
                 set_data_normalized(span, span_attr, value)
+
+
+def set_response_span_data(span, response, include_pii, response_config, collected_text=None):
+    # type: (Span, Any, bool, Dict[str, Any], Optional[List[str]]) -> None
+    """
+    Set response span data from a declarative config.
+
+    response_config keys (all optional):
+        sources: dict of span attribute -> source paths; set regardless of include_pii
+        pii_sources: same shape as sources; only read when include_pii is true
+        extract_text: callable (response) -> list[str] | None; only called when include_pii is true
+        usage: dict with "input_tokens"/"output_tokens" lists of source paths
+    collected_text: non-empty list of text chunks; joined and used instead of extract_text
+    """
+    set_span_data_from_sources(
+        span, response, response_config.get("sources", {}), require_truthy=False
+    )
+
+    if include_pii:  # everything in this branch may carry user content
+        pii_sources = response_config.get("pii_sources")
+        if pii_sources:
+            set_span_data_from_sources(
+                span, response, pii_sources, require_truthy=True
+            )
+        if collected_text:  # pre-collected chunks take precedence over extract_text
+            set_data_normalized(
+                span, SPANDATA.GEN_AI_RESPONSE_TEXT, ["".join(collected_text)]
+            )
+        else:
+            extract_text = response_config.get("extract_text")
+            if extract_text:
+                texts = extract_text(response)
+                if texts:  # None or an empty list leaves the attribute unset
+                    set_data_normalized(span, SPANDATA.GEN_AI_RESPONSE_TEXT, texts)
+
+    usage_config = response_config.get("usage")
+    if usage_config:  # token usage is recorded only when a usage config is present
+        record_token_usage(
+            span,
+            input_tokens=get_first_from_sources(
+                response, usage_config.get("input_tokens", [])
+            ),
+            output_tokens=get_first_from_sources(
+                response, usage_config.get("output_tokens", [])
+            ),
+        )
diff --git a/sentry_sdk/ai/utils.py b/sentry_sdk/ai/utils.py
@@ -8,7 +8,7 @@
 from sentry_sdk._types import BLOB_DATA_SUBSTITUTE
 
 if TYPE_CHECKING:
-    from typing import Any, Callable, Dict, List, Optional, Tuple
+    from typing import Any, Callable, Dict, List, Mapping, Optional, Sequence, Tuple
 
     from sentry_sdk.tracing import Span
 
@@ -725,3 +725,32 @@ def set_conversation_id(conversation_id: str) -> None:
     """
     scope = sentry_sdk.get_current_scope()
     scope.set_conversation_id(conversation_id)
+
+
+def transitive_getattr(obj, *attrs):
+    # type: (Any, *str) -> Any
+    current = obj  # follow obj.a.b.c one attribute at a time
+    for attr in attrs:
+        current = getattr(current, attr, None)
+        if current is None:  # attribute missing, or present but None
+            return None
+    return current  # with no attrs given this is obj itself
+
+
+def get_first_from_sources(obj, source_paths, require_truthy=False):
+    # type: (Any, Sequence[tuple[str, ...]], bool) -> Any
+    for source_path in source_paths:  # paths are tried in order; first acceptable value wins
+        value = transitive_getattr(obj, *source_path)
+        if value is None:  # unresolved path: fall through to the next source
+            continue
+        if not require_truthy or value:  # falsy values (0, "", []) only skipped on request
+            return value
+    return None  # no source produced an acceptable value
+
+
+def set_span_data_from_sources(span, obj, target_sources, require_truthy):
+    # type: (Any, Any, Mapping[str, Sequence[tuple[str, ...]]], bool) -> None
+    for spandata_key, source_paths in target_sources.items():  # one span attribute per entry
+        value = get_first_from_sources(obj, source_paths, require_truthy=require_truthy)
+        if value is not None:  # attributes with no resolved value are left unset
+            set_data_normalized(span, spandata_key, value)
diff --git a/sentry_sdk/integrations/cohere/__init__.py b/sentry_sdk/integrations/cohere/__init__.py
@@ -3,7 +3,7 @@
 
 from sentry_sdk.ai.monitoring import record_token_usage
 from sentry_sdk.consts import OP, SPANDATA
-from sentry_sdk.ai.span_config import set_input_span_data
+from sentry_sdk.ai.span_config import set_request_span_data
 
 from typing import TYPE_CHECKING
 
@@ -92,7 +92,7 @@ def new_embed(*args, **kwargs):
             name=f"embeddings {model}".strip(),
             origin=CohereIntegration.origin,
         ) as span:
-            set_input_span_data(span, kwargs, integration, COHERE_EMBED_CONFIG)
+            set_request_span_data(span, kwargs, integration, COHERE_EMBED_CONFIG)
 
             try:
                 res = f(*args, **kwargs)
diff --git a/sentry_sdk/integrations/cohere/utils.py b/sentry_sdk/integrations/cohere/utils.py
diff --git a/sentry_sdk/integrations/cohere/v1.py b/sentry_sdk/integrations/cohere/v1.py
@@ -1,9 +1,11 @@
 import sys
 from functools import wraps
 
-from sentry_sdk.ai.monitoring import record_token_usage
-from sentry_sdk.ai.span_config import set_input_span_data
-from sentry_sdk.ai.utils import set_data_normalized, transform_message_content
+from sentry_sdk.ai.span_config import set_request_span_data, set_response_span_data
+from sentry_sdk.ai.utils import (
+    get_first_from_sources,
+    transform_message_content,
+)
 from sentry_sdk.consts import OP, SPANDATA
 
 from typing import TYPE_CHECKING
@@ -17,10 +19,6 @@
     CohereIntegration,
     _capture_exception,
 )
-from sentry_sdk.integrations.cohere.utils import (
-    get_first_from_sources,
-    set_span_data_from_sources,
-)
 from sentry_sdk.scope import should_send_default_pii
 from sentry_sdk.utils import capture_internal_exceptions, reraise
 
@@ -38,34 +36,41 @@
 except ImportError:
     _has_chat_types = False
 
+def _extract_response_text(response):
+    # type: (Any) -> list[str] | None
+    text = getattr(response, "text", None)  # a response without .text yields None
+    return [text] if text is not None else None  # wrap in a list; an empty string is kept
+
+
 COHERE_V1_CHAT_CONFIG = {
     "static": {
         SPANDATA.GEN_AI_SYSTEM: "cohere",
         SPANDATA.GEN_AI_OPERATION_NAME: "chat",
     },
     "extract_messages": lambda kw: _extract_messages(kw),
+    "response": {  # passed as response_config to set_response_span_data
+        "sources": {
+            SPANDATA.GEN_AI_RESPONSE_ID: [("generation_id",)],
+            SPANDATA.GEN_AI_RESPONSE_FINISH_REASONS: [("finish_reason",)],
+        },
+        "pii_sources": {  # only read when include_pii is true
+            SPANDATA.GEN_AI_RESPONSE_TOOL_CALLS: [("tool_calls",)],
+        },
+        "extract_text": _extract_response_text,
+        "usage": {  # each entry lists attribute paths, tried in order
+            "input_tokens": [
+                ("meta", "billed_units", "input_tokens"),
+                ("meta", "tokens", "input_tokens"),
+            ],
+            "output_tokens": [
+                ("meta", "billed_units", "output_tokens"),
+                ("meta", "tokens", "output_tokens"),
+            ],
+        },
+    },
+    "stream_response_object": [("response",)],  # path from a stream-end event to its response
 }
 
-CHAT_RESPONSE_SOURCES = {
-    SPANDATA.GEN_AI_RESPONSE_ID: [("generation_id",)],
-    SPANDATA.GEN_AI_RESPONSE_FINISH_REASONS: [("finish_reason",)],
-}
-PII_CHAT_RESPONSE_SOURCES = {
-    SPANDATA.GEN_AI_RESPONSE_TOOL_CALLS: [("tool_calls",)],
-}
-CHAT_RESPONSE_TEXT_SOURCES = [("text",)]
-CHAT_USAGE_TOKEN_SOURCES = {
-    SPANDATA.GEN_AI_USAGE_INPUT_TOKENS: [
-        ("meta", "billed_units", "input_tokens"),
-        ("meta", "tokens", "input_tokens"),
-    ],
-    SPANDATA.GEN_AI_USAGE_OUTPUT_TOKENS: [
-        ("meta", "billed_units", "output_tokens"),
-        ("meta", "tokens", "output_tokens"),
-    ],
-}
-STREAM_RESPONSE_SOURCES = [("response",)]
-
 
 def setup_v1(wrap_embed_fn):
     # type: (Callable[..., Any]) -> None
@@ -113,19 +118,20 @@ def new_chat(*args, **kwargs):
                 reraise(*exc_info)
 
             with capture_internal_exceptions():
-                span_data = {SPANDATA.GEN_AI_RESPONSE_STREAMING: streaming}
-                if model:
-                    span_data[SPANDATA.GEN_AI_REQUEST_MODEL] = model
-                set_input_span_data(
+                span_data = {
+                    SPANDATA.GEN_AI_RESPONSE_STREAMING: streaming,
+                    SPANDATA.GEN_AI_REQUEST_MODEL: model if model else None,
+                }
+                set_request_span_data(
                     span, kwargs, integration, COHERE_V1_CHAT_CONFIG, span_data
                 )
 
                 if streaming:
                     return _iter_stream_events(res, span, include_pii)
-                if isinstance(res, NonStreamedChatResponse):
-                    _collect_response_fields(span, res, include_pii=include_pii)
                 else:
-                    set_data_normalized(span, "unknown_response", True)
+                    set_response_span_data(
+                        span, res, include_pii, COHERE_V1_CHAT_CONFIG["response"]
+                    )
                 return res
 
     return new_chat
@@ -154,36 +160,11 @@ def _iter_stream_events(old_iterator, span, include_pii):
             if isinstance(x, ChatStreamEndEvent) or isinstance(
                 x, StreamEndStreamedChatResponse
             ):
-                _collect_v1_stream_end_fields(span, x, include_pii)
+                response = get_first_from_sources(
+                    x, COHERE_V1_CHAT_CONFIG["stream_response_object"]
+                )
+                if response is not None:
+                    set_response_span_data(
+                        span, response, include_pii, COHERE_V1_CHAT_CONFIG["response"]
+                    )
             yield x
-
-
-def _collect_v1_stream_end_fields(span, event, include_pii):
-    # type: (Any, Any, bool) -> None
-    response = get_first_from_sources(event, STREAM_RESPONSE_SOURCES)
-    if response is not None:
-        _collect_response_fields(span, response, include_pii)
-
-
-def _collect_response_fields(span, response, include_pii):
-    # type: (Any, Any, bool) -> None
-    if include_pii:
-        text = get_first_from_sources(response, CHAT_RESPONSE_TEXT_SOURCES)
-        if text is not None:
-            set_data_normalized(span, SPANDATA.GEN_AI_RESPONSE_TEXT, [text])
-        set_span_data_from_sources(
-            span, response, PII_CHAT_RESPONSE_SOURCES, require_truthy=False
-        )
-
-    set_span_data_from_sources(
-        span, response, CHAT_RESPONSE_SOURCES, require_truthy=False
-    )
-    record_token_usage(
-        span,
-        input_tokens=get_first_from_sources(
-            response, CHAT_USAGE_TOKEN_SOURCES[SPANDATA.GEN_AI_USAGE_INPUT_TOKENS]
-        ),
-        output_tokens=get_first_from_sources(
-            response, CHAT_USAGE_TOKEN_SOURCES[SPANDATA.GEN_AI_USAGE_OUTPUT_TOKENS]
-        ),
-    )
diff --git a/sentry_sdk/integrations/cohere/v2.py b/sentry_sdk/integrations/cohere/v2.py