Preview: tracing_utils.py
Size: 54.36 KB
//proc/thread-self/root/opt/hc_python/lib/python3.12/site-packages/sentry_sdk/tracing_utils.py
import contextlib
import functools
import inspect
import os
import re
import sys
import uuid
import warnings
from collections.abc import Mapping, MutableMapping
from datetime import datetime, timedelta, timezone
from random import Random
from urllib.parse import quote, unquote
try:
from re import Pattern
except ImportError:
# 3.6
from typing import Pattern
from typing import TYPE_CHECKING
import sentry_sdk
from sentry_sdk.consts import OP, SPANDATA, SPANTEMPLATE
from sentry_sdk.utils import (
_is_external_source,
_is_in_project_root,
_module_in_list,
capture_internal_exceptions,
filename_for_module,
is_sentry_url,
is_valid_sample_rate,
logger,
match_regex_list,
qualname_from_function,
safe_repr,
to_string,
try_convert,
)
if TYPE_CHECKING:
from types import FrameType
from typing import Any, Dict, Generator, Iterator, Optional, Tuple, Union
from sentry_sdk._types import Attributes
SENTRY_TRACE_REGEX = re.compile(
"^[ \t]*" # whitespace
"([0-9a-f]{32})?" # trace_id
"-?([0-9a-f]{16})?" # span_id
"-?([01])?" # sampled
"[ \t]*$" # whitespace
)
# This is a normal base64 regex, modified to reflect that fact that we strip the
# trailing = or == off
base64_stripped = (
# any of the characters in the base64 "alphabet", in multiples of 4
"([a-zA-Z0-9+/]{4})*"
# either nothing or 2 or 3 base64-alphabet characters (see
# https://en.wikipedia.org/wiki/Base64#Decoding_Base64_without_padding for
# why there's never only 1 extra character)
"([a-zA-Z0-9+/]{2,3})?"
)
class EnvironHeaders(Mapping): # type: ignore
def __init__(
self,
environ: "Mapping[str, str]",
prefix: str = "HTTP_",
) -> None:
self.environ = environ
self.prefix = prefix
def __getitem__(self, key: str) -> "Optional[Any]":
return self.environ[self.prefix + key.replace("-", "_").upper()]
def __len__(self) -> int:
return sum(1 for _ in iter(self))
def __iter__(self) -> "Generator[str, None, None]":
for k in self.environ:
if not isinstance(k, str):
continue
k = k.replace("-", "_").upper()
if not k.startswith(self.prefix):
continue
yield k[len(self.prefix) :]
def has_tracing_enabled(options: "Optional[Dict[str, Any]]") -> bool:
"""
Returns True if either traces_sample_rate or traces_sampler is
defined and enable_tracing is set and not false.
"""
if options is None:
return False
return bool(
options.get("enable_tracing") is not False
and (
options.get("traces_sample_rate") is not None
or options.get("traces_sampler") is not None
)
)
def has_span_streaming_enabled(options: "Optional[dict[str, Any]]") -> bool:
if options is None:
return False
return (options.get("_experiments") or {}).get("trace_lifecycle") == "stream"
def should_truncate_gen_ai_input(options: "Optional[dict[str, Any]]") -> bool:
if options is None:
return True
return not options.get(
"stream_gen_ai_spans", False
) and not has_span_streaming_enabled(options)
@contextlib.contextmanager
def record_sql_queries(
cursor: "Any",
query: "Any",
params_list: "Any",
paramstyle: "Optional[str]",
executemany: bool,
record_cursor_repr: bool = False,
span_origin: str = "manual",
) -> "Generator[Union[sentry_sdk.tracing.Span, sentry_sdk.traces.StreamedSpan], None, None]":
# TODO: Bring back capturing of params by default
client = sentry_sdk.get_client()
if client.options["_experiments"].get("record_sql_params", False):
if not params_list or params_list == [None]:
params_list = None
if paramstyle == "pyformat":
paramstyle = "format"
else:
params_list = None
paramstyle = None
query = _format_sql(cursor, query)
data = {}
if params_list is not None:
data["db.params"] = params_list
if paramstyle is not None:
data["db.paramstyle"] = paramstyle
if executemany:
data["db.executemany"] = True
if record_cursor_repr and cursor is not None:
data["db.cursor"] = cursor
with capture_internal_exceptions():
sentry_sdk.add_breadcrumb(message=query, category="query", data=data)
if has_span_streaming_enabled(client.options):
with sentry_sdk.traces.start_span(
name="<unknown SQL query>" if query is None else query,
attributes={
"sentry.origin": span_origin,
"sentry.op": OP.DB,
},
) as span:
yield span
else:
with sentry_sdk.start_span(
op=OP.DB,
name=query,
origin=span_origin,
) as span:
for k, v in data.items():
span.set_data(k, v)
yield span
def maybe_create_breadcrumbs_from_span(
scope: "sentry_sdk.Scope", span: "sentry_sdk.tracing.Span"
) -> None:
if span.op == OP.DB_REDIS:
scope.add_breadcrumb(
message=span.description, type="redis", category="redis", data=span._tags
)
elif span.op == OP.HTTP_CLIENT:
level = None
status_code = span._data.get(SPANDATA.HTTP_STATUS_CODE)
if status_code:
if 500 <= status_code <= 599:
level = "error"
elif 400 <= status_code <= 499:
level = "warning"
if level:
scope.add_breadcrumb(
type="http", category="httplib", data=span._data, level=level
)
else:
scope.add_breadcrumb(type="http", category="httplib", data=span._data)
elif span.op == "subprocess":
scope.add_breadcrumb(
type="subprocess",
category="subprocess",
message=span.description,
data=span._data,
)
def _get_frame_module_abs_path(frame: "FrameType") -> "Optional[str]":
try:
return frame.f_code.co_filename
except Exception:
return None
def _should_be_included(
is_sentry_sdk_frame: bool,
namespace: "Optional[str]",
in_app_include: "Optional[list[str]]",
in_app_exclude: "Optional[list[str]]",
abs_path: "Optional[str]",
project_root: "Optional[str]",
) -> bool:
# in_app_include takes precedence over in_app_exclude
should_be_included = _module_in_list(namespace, in_app_include)
should_be_excluded = _is_external_source(abs_path) or _module_in_list(
namespace, in_app_exclude
)
return not is_sentry_sdk_frame and (
should_be_included
or (_is_in_project_root(abs_path, project_root) and not should_be_excluded)
)
def add_source(
span: "Union[sentry_sdk.tracing.Span, sentry_sdk.traces.StreamedSpan]",
project_root: "Optional[str]",
in_app_include: "Optional[list[str]]",
in_app_exclude: "Optional[list[str]]",
) -> None:
"""
Adds OTel compatible source code information to the span
"""
# Find the correct frame
frame: "Union[FrameType, None]" = sys._getframe()
while frame is not None:
abs_path = _get_frame_module_abs_path(frame)
try:
namespace: "Optional[str]" = frame.f_globals.get("__name__")
except Exception:
namespace = None
is_sentry_sdk_frame = namespace is not None and namespace.startswith(
"sentry_sdk."
)
should_be_included = _should_be_included(
is_sentry_sdk_frame=is_sentry_sdk_frame,
namespace=namespace,
in_app_include=in_app_include,
in_app_exclude=in_app_exclude,
abs_path=abs_path,
project_root=project_root,
)
if should_be_included:
break
frame = frame.f_back
else:
frame = None
# Set the data
if frame is not None:
try:
lineno = frame.f_lineno
except Exception:
lineno = None
if lineno is not None:
if isinstance(span, Span):
span.set_data(SPANDATA.CODE_LINENO, lineno)
else:
span.set_attribute("code.line.number", lineno)
try:
namespace = frame.f_globals.get("__name__")
except Exception:
namespace = None
if namespace is not None:
if isinstance(span, Span):
span.set_data(SPANDATA.CODE_NAMESPACE, namespace)
else:
span.set_attribute(SPANDATA.CODE_NAMESPACE, namespace)
filepath = _get_frame_module_abs_path(frame)
if filepath is not None:
if namespace is not None:
in_app_path = filename_for_module(namespace, filepath)
elif project_root is not None and filepath.startswith(project_root):
in_app_path = filepath.replace(project_root, "").lstrip(os.sep)
else:
in_app_path = filepath
if isinstance(span, Span):
span.set_data(SPANDATA.CODE_FILEPATH, in_app_path)
else:
if in_app_path is not None:
span.set_attribute("code.file.path", in_app_path)
try:
code_function = frame.f_code.co_name
except Exception:
code_function = None
if code_function is not None:
if isinstance(span, Span):
span.set_data(SPANDATA.CODE_FUNCTION, frame.f_code.co_name)
else:
span.set_attribute(SPANDATA.CODE_FUNCTION, frame.f_code.co_name)
def add_query_source(
span: "Union[sentry_sdk.tracing.Span, sentry_sdk.traces.StreamedSpan]",
) -> None:
"""
Adds OTel compatible source code information to a database query span
"""
client = sentry_sdk.get_client()
if not client.is_active():
return
if isinstance(span, Span):
# In the StreamedSpan case, we need to add the extra span information before
# the span finishes, so it's expected that this will be None. In the Span case,
# it should already be finished.
if span.timestamp is None:
return
if span.start_timestamp is None:
return
should_add_query_source = client.options.get("enable_db_query_source", True)
if not should_add_query_source:
return
if isinstance(span, StreamedSpan):
end_timestamp = span.end_timestamp
else:
end_timestamp = span.timestamp
end_timestamp = end_timestamp or datetime.now(timezone.utc)
duration = end_timestamp - span.start_timestamp
threshold = client.options.get("db_query_source_threshold_ms", 0)
slow_query = duration / timedelta(milliseconds=1) > threshold
if not slow_query:
return
add_source(
span=span,
project_root=client.options["project_root"],
in_app_include=client.options.get("in_app_include"),
in_app_exclude=client.options.get("in_app_exclude"),
)
def add_http_request_source(
span: "Union[sentry_sdk.tracing.Span, sentry_sdk.traces.StreamedSpan]",
) -> None:
"""
Adds OTel compatible source code information to a span for an outgoing HTTP request
"""
client = sentry_sdk.get_client()
if not client.is_active():
return
if isinstance(span, Span):
# In the StreamedSpan case, we need to add the extra span information before
# the span finishes, so it's expected that this will be None. In the Span case,
# it should already be finished.
if span.timestamp is None:
return
if span.start_timestamp is None:
return
should_add_request_source = client.options.get("enable_http_request_source", True)
if not should_add_request_source:
return
if isinstance(span, StreamedSpan):
end_timestamp = span.end_timestamp
else:
end_timestamp = span.timestamp
end_timestamp = end_timestamp or datetime.now(timezone.utc)
duration = end_timestamp - span.start_timestamp
threshold = client.options.get("http_request_source_threshold_ms", 0)
slow_query = duration / timedelta(milliseconds=1) > threshold
if not slow_query:
return
add_source(
span=span,
project_root=client.options["project_root"],
in_app_include=client.options.get("in_app_include"),
in_app_exclude=client.options.get("in_app_exclude"),
)
def extract_sentrytrace_data(
header: "Optional[str]",
) -> "Optional[Dict[str, Union[str, bool, None]]]":
"""
Given a `sentry-trace` header string, return a dictionary of data.
"""
if not header:
return None
if header.startswith("00-") and header.endswith("-00"):
header = header[3:-3]
match = SENTRY_TRACE_REGEX.match(header)
if not match:
return None
trace_id, parent_span_id, sampled_str = match.groups()
parent_sampled = None
if trace_id:
trace_id = "{:032x}".format(int(trace_id, 16))
if parent_span_id:
parent_span_id = "{:016x}".format(int(parent_span_id, 16))
if sampled_str:
parent_sampled = sampled_str != "0"
return {
"trace_id": trace_id,
"parent_span_id": parent_span_id,
"parent_sampled": parent_sampled,
}
def _format_sql(cursor: "Any", sql: str) -> "Optional[str]":
real_sql = None
# If we're using psycopg2, it could be that we're
# looking at a query that uses Composed objects. Use psycopg2's mogrify
# function to format the query. We lose per-parameter trimming but gain
# accuracy in formatting.
try:
if hasattr(cursor, "mogrify"):
real_sql = cursor.mogrify(sql)
if isinstance(real_sql, bytes):
real_sql = real_sql.decode(cursor.connection.encoding)
except Exception:
real_sql = None
return real_sql or to_string(sql)
class PropagationContext:
"""
The PropagationContext represents the data of a trace in Sentry.
"""
__slots__ = (
"_trace_id",
"_span_id",
"parent_span_id",
"parent_sampled",
"baggage",
"custom_sampling_context",
)
def __init__(
self,
trace_id: "Optional[str]" = None,
span_id: "Optional[str]" = None,
parent_span_id: "Optional[str]" = None,
parent_sampled: "Optional[bool]" = None,
dynamic_sampling_context: "Optional[Dict[str, str]]" = None,
baggage: "Optional[Baggage]" = None,
) -> None:
self._trace_id = trace_id
"""The trace id of the Sentry trace."""
self._span_id = span_id
"""The span id of the currently executing span."""
self.parent_span_id = parent_span_id
"""The id of the parent span that started this span.
The parent span could also be a span in an upstream service."""
self.parent_sampled = parent_sampled
"""Boolean indicator if the parent span was sampled.
Important when the parent span originated in an upstream service,
because we want to sample the whole trace, or nothing from the trace."""
self.baggage = baggage
"""Parsed baggage header that is used for dynamic sampling decisions."""
"""DEPRECATED this only exists for backwards compat of constructor."""
if baggage is None and dynamic_sampling_context is not None:
self.baggage = Baggage(dynamic_sampling_context)
self.custom_sampling_context: "Optional[dict[str, Any]]" = None
@classmethod
def from_incoming_data(
cls, incoming_data: "Dict[str, Any]"
) -> "PropagationContext":
propagation_context = PropagationContext()
normalized_data = normalize_incoming_data(incoming_data)
sentry_trace_header = normalized_data.get(SENTRY_TRACE_HEADER_NAME)
sentrytrace_data = extract_sentrytrace_data(sentry_trace_header)
# nothing to propagate if no sentry-trace
if sentrytrace_data is None:
return propagation_context
baggage_header = normalized_data.get(BAGGAGE_HEADER_NAME)
baggage = (
Baggage.from_incoming_header(baggage_header) if baggage_header else None
)
if not _should_continue_trace(baggage):
return propagation_context
propagation_context.update(sentrytrace_data)
if baggage:
propagation_context.baggage = baggage
propagation_context._fill_sample_rand()
return propagation_context
@property
def trace_id(self) -> str:
"""The trace id of the Sentry trace."""
if not self._trace_id:
# New trace, don't fill in sample_rand
self._trace_id = uuid.uuid4().hex
return self._trace_id
@trace_id.setter
def trace_id(self, value: str) -> None:
self._trace_id = value
@property
def span_id(self) -> str:
"""The span id of the currently executed span."""
if not self._span_id:
self._span_id = uuid.uuid4().hex[16:]
return self._span_id
@span_id.setter
def span_id(self, value: str) -> None:
self._span_id = value
@property
def dynamic_sampling_context(self) -> "Optional[Dict[str, Any]]":
return self.get_baggage().dynamic_sampling_context()
def to_traceparent(self) -> str:
return f"{self.trace_id}-{self.span_id}"
def get_baggage(self) -> "Baggage":
if self.baggage is None:
self.baggage = Baggage.populate_from_propagation_context(self)
return self.baggage
def iter_headers(self) -> "Iterator[Tuple[str, str]]":
"""
Creates a generator which returns the propagation_context's ``sentry-trace`` and ``baggage`` headers.
"""
yield SENTRY_TRACE_HEADER_NAME, self.to_traceparent()
baggage = self.get_baggage().serialize()
if baggage:
yield BAGGAGE_HEADER_NAME, baggage
def update(self, other_dict: "Dict[str, Any]") -> None:
"""
Updates the PropagationContext with data from the given dictionary.
"""
for key, value in other_dict.items():
try:
setattr(self, key, value)
except AttributeError:
pass
def _set_custom_sampling_context(
self, custom_sampling_context: "dict[str, Any]"
) -> None:
self.custom_sampling_context = custom_sampling_context
def __repr__(self) -> str:
return "<PropagationContext _trace_id={} _span_id={} parent_span_id={} parent_sampled={} baggage={}>".format(
self._trace_id,
self._span_id,
self.parent_span_id,
self.parent_sampled,
self.baggage,
)
def _fill_sample_rand(self) -> None:
"""
Ensure that there is a valid sample_rand value in the baggage.
If there is a valid sample_rand value in the baggage, we keep it.
Otherwise, we generate a sample_rand value according to the following:
- If we have a parent_sampled value and a sample_rate in the DSC, we compute
a sample_rand value randomly in the range:
- [0, sample_rate) if parent_sampled is True,
- or, in the range [sample_rate, 1) if parent_sampled is False.
- If either parent_sampled or sample_rate is missing, we generate a random
value in the range [0, 1).
The sample_rand is deterministically generated from the trace_id, if present.
This function does nothing if there is no baggage.
"""
if self.baggage is None:
return
sample_rand = try_convert(float, self.baggage.sentry_items.get("sample_rand"))
if sample_rand is not None and 0 <= sample_rand < 1:
# sample_rand is present and valid, so don't overwrite it
return
# Get the sample rate and compute the transformation that will map the random value
# to the desired range: [0, 1), [0, sample_rate), or [sample_rate, 1).
sample_rate = try_convert(float, self.baggage.sentry_items.get("sample_rate"))
lower, upper = _sample_rand_range(self.parent_sampled, sample_rate)
try:
sample_rand = _generate_sample_rand(self.trace_id, interval=(lower, upper))
except ValueError:
# ValueError is raised if the interval is invalid, i.e. lower >= upper.
# lower >= upper might happen if the incoming trace's sampled flag
# and sample_rate are inconsistent, e.g. sample_rate=0.0 but sampled=True.
# We cannot generate a sensible sample_rand value in this case.
logger.debug(
f"Could not backfill sample_rand, since parent_sampled={self.parent_sampled} "
f"and sample_rate={sample_rate}."
)
return
self.baggage.sentry_items["sample_rand"] = f"{sample_rand:.6f}" # noqa: E231
def _sample_rand(self) -> "Optional[str]":
"""Convenience method to get the sample_rand value from the baggage."""
if self.baggage is None:
return None
return self.baggage.sentry_items.get("sample_rand")
class Baggage:
"""
The W3C Baggage header information (see https://www.w3.org/TR/baggage/).
Before mutating a `Baggage` object, calling code must check that `mutable` is `True`.
Mutating a `Baggage` object that has `mutable` set to `False` is not allowed, but
it is the caller's responsibility to enforce this restriction.
"""
__slots__ = ("sentry_items", "third_party_items", "mutable")
SENTRY_PREFIX = "sentry-"
SENTRY_PREFIX_REGEX = re.compile("^sentry-")
def __init__(
self,
sentry_items: "Dict[str, str]",
third_party_items: str = "",
mutable: bool = True,
):
self.sentry_items = sentry_items
self.third_party_items = third_party_items
self.mutable = mutable
@classmethod
def from_incoming_header(
cls,
header: "Optional[str]",
*,
_sample_rand: "Optional[str]" = None,
) -> "Baggage":
"""
freeze if incoming header already has sentry baggage
"""
sentry_items = {}
third_party_items = ""
mutable = True
if header:
for item in header.split(","):
if "=" not in item:
continue
with capture_internal_exceptions():
item = item.strip()
key, val = item.split("=", 1)
if Baggage.SENTRY_PREFIX_REGEX.match(key):
baggage_key = unquote(key.split("-")[1])
sentry_items[baggage_key] = unquote(val)
mutable = False
else:
third_party_items += ("," if third_party_items else "") + item
if _sample_rand is not None:
sentry_items["sample_rand"] = str(_sample_rand)
mutable = False
return Baggage(sentry_items, third_party_items, mutable)
@classmethod
def from_options(cls, scope: "sentry_sdk.scope.Scope") -> "Optional[Baggage]":
"""
Deprecated: use populate_from_propagation_context
"""
if scope._propagation_context is None:
return Baggage({})
return Baggage.populate_from_propagation_context(scope._propagation_context)
@classmethod
def populate_from_propagation_context(
cls, propagation_context: "PropagationContext"
) -> "Baggage":
sentry_items: "Dict[str, str]" = {}
third_party_items = ""
mutable = False
client = sentry_sdk.get_client()
if not client.is_active():
return Baggage(sentry_items)
options = client.options
sentry_items["trace_id"] = propagation_context.trace_id
if options.get("environment"):
sentry_items["environment"] = options["environment"]
if options.get("release"):
sentry_items["release"] = options["release"]
if client.parsed_dsn:
sentry_items["public_key"] = client.parsed_dsn.public_key
if client.parsed_dsn.org_id:
sentry_items["org_id"] = client.parsed_dsn.org_id
if options.get("traces_sample_rate"):
sentry_items["sample_rate"] = str(options["traces_sample_rate"])
return Baggage(sentry_items, third_party_items, mutable)
@classmethod
def populate_from_transaction(
cls, transaction: "sentry_sdk.tracing.Transaction"
) -> "Baggage":
"""
Populate fresh baggage entry with sentry_items and make it immutable
if this is the head SDK which originates traces.
"""
client = sentry_sdk.get_client()
sentry_items: "Dict[str, str]" = {}
if not client.is_active():
return Baggage(sentry_items)
options = client.options or {}
sentry_items["trace_id"] = transaction.trace_id
sentry_items["sample_rand"] = f"{transaction._sample_rand:.6f}" # noqa: E231
if options.get("environment"):
sentry_items["environment"] = options["environment"]
if options.get("release"):
sentry_items["release"] = options["release"]
if client.parsed_dsn:
sentry_items["public_key"] = client.parsed_dsn.public_key
if client.parsed_dsn.org_id:
sentry_items["org_id"] = client.parsed_dsn.org_id
if (
transaction.name
and transaction.source not in LOW_QUALITY_TRANSACTION_SOURCES
):
sentry_items["transaction"] = transaction.name
if transaction.sample_rate is not None:
sentry_items["sample_rate"] = str(transaction.sample_rate)
if transaction.sampled is not None:
sentry_items["sampled"] = "true" if transaction.sampled else "false"
# there's an existing baggage but it was mutable,
# which is why we are creating this new baggage.
# However, if by chance the user put some sentry items in there, give them precedence.
if transaction._baggage and transaction._baggage.sentry_items:
sentry_items.update(transaction._baggage.sentry_items)
return Baggage(sentry_items, mutable=False)
@classmethod
def populate_from_segment(cls, segment: "StreamedSpan") -> "Baggage":
"""
Populate fresh baggage entry with sentry_items and make it immutable
if this is the head SDK which originates traces.
"""
client = sentry_sdk.get_client()
sentry_items: "Dict[str, str]" = {}
if not client.is_active():
return Baggage(sentry_items)
options = client.options or {}
sentry_items["trace_id"] = segment.trace_id
sentry_items["sample_rand"] = f"{segment._sample_rand:.6f}" # noqa: E231
if options.get("environment"):
sentry_items["environment"] = options["environment"]
if options.get("release"):
sentry_items["release"] = options["release"]
if client.parsed_dsn:
sentry_items["public_key"] = client.parsed_dsn.public_key
if client.parsed_dsn.org_id:
sentry_items["org_id"] = client.parsed_dsn.org_id
if (
segment.get_attributes().get("sentry.span.source")
not in LOW_QUALITY_SEGMENT_SOURCES
) and segment._name:
sentry_items["transaction"] = segment._name
if segment._sample_rate is not None:
sentry_items["sample_rate"] = str(segment._sample_rate)
if segment.sampled is not None:
sentry_items["sampled"] = "true" if segment.sampled else "false"
# There's an existing baggage but it was mutable, which is why we are
# creating this new baggage.
# However, if by chance the user put some sentry items in there, give
# them precedence.
if segment._baggage and segment._baggage.sentry_items:
sentry_items.update(segment._baggage.sentry_items)
return Baggage(sentry_items, mutable=False)
def freeze(self) -> None:
self.mutable = False
def dynamic_sampling_context(self) -> "Dict[str, str]":
header = {}
for key, item in self.sentry_items.items():
header[key] = item
return header
def serialize(self, include_third_party: bool = False) -> str:
items = []
for key, val in self.sentry_items.items():
with capture_internal_exceptions():
item = Baggage.SENTRY_PREFIX + quote(key) + "=" + quote(str(val))
items.append(item)
if include_third_party:
items.append(self.third_party_items)
return ",".join(items)
@staticmethod
def strip_sentry_baggage(header: str) -> str:
"""Remove Sentry baggage from the given header.
Given a Baggage header, return a new Baggage header with all Sentry baggage items removed.
"""
return ",".join(
(
item
for item in header.split(",")
if not Baggage.SENTRY_PREFIX_REGEX.match(item.strip())
)
)
def _sample_rand(self) -> "Optional[float]":
"""Convenience method to get the sample_rand value from the sentry_items.
We validate the value and parse it as a float before returning it. The value is considered
valid if it is a float in the range [0, 1).
"""
sample_rand = try_convert(float, self.sentry_items.get("sample_rand"))
if sample_rand is not None and 0.0 <= sample_rand < 1.0:
return sample_rand
return None
def __repr__(self) -> str:
return f'<Baggage "{self.serialize(include_third_party=True)}", mutable={self.mutable}>'
def should_propagate_trace(client: "sentry_sdk.client.BaseClient", url: str) -> bool:
"""
Returns True if url matches trace_propagation_targets configured in the given client. Otherwise, returns False.
"""
trace_propagation_targets = client.options["trace_propagation_targets"]
if is_sentry_url(client, url):
return False
return match_regex_list(url, trace_propagation_targets, substring_matching=True)
def normalize_incoming_data(incoming_data: "Dict[str, Any]") -> "Dict[str, Any]":
"""
Normalizes incoming data so the keys are all lowercase with dashes instead of underscores and stripped from known prefixes.
"""
data = {}
for key, value in incoming_data.items():
if key.startswith("HTTP_"):
key = key[5:]
key = key.replace("_", "-").lower()
data[key] = value
return data
def create_span_decorator(
op: "Optional[Union[str, OP]]" = None,
name: "Optional[str]" = None,
attributes: "Optional[dict[str, Any]]" = None,
template: "SPANTEMPLATE" = SPANTEMPLATE.DEFAULT,
) -> "Any":
"""
Create a span decorator that can wrap both sync and async functions.
:param op: The operation type for the span.
:type op: str or :py:class:`sentry_sdk.consts.OP` or None
:param name: The name of the span.
:type name: str or None
:param attributes: Additional attributes to set on the span.
:type attributes: dict or None
:param template: The type of span to create. This determines what kind of
span instrumentation and data collection will be applied. Use predefined
constants from :py:class:`sentry_sdk.consts.SPANTEMPLATE`.
The default is `SPANTEMPLATE.DEFAULT` which is the right choice for most
use cases.
:type template: :py:class:`sentry_sdk.consts.SPANTEMPLATE`
"""
from sentry_sdk.scope import should_send_default_pii
def span_decorator(f: "Any") -> "Any":
"""
Decorator to create a span for the given function.
"""
@functools.wraps(f)
async def async_wrapper(*args: "Any", **kwargs: "Any") -> "Any":
current_span = get_current_span()
if current_span is None:
logger.debug(
"Cannot create a child span for %s. "
"Please start a Sentry transaction before calling this function.",
qualname_from_function(f),
)
return await f(*args, **kwargs)
if isinstance(current_span, StreamedSpan):
warnings.warn(
"Use the @sentry_sdk.traces.trace decorator in span streaming mode.",
DeprecationWarning,
stacklevel=2,
)
return await f(*args, **kwargs)
span_op = op or _get_span_op(template)
function_name = name or qualname_from_function(f) or ""
span_name = _get_span_name(template, function_name, kwargs)
send_pii = should_send_default_pii()
with current_span.start_child(
op=span_op,
name=span_name,
) as span:
span.update_data(attributes or {})
_set_input_attributes(
span, template, send_pii, function_name, f, args, kwargs
)
result = await f(*args, **kwargs)
_set_output_attributes(span, template, send_pii, result)
return result
try:
async_wrapper.__signature__ = inspect.signature(f) # type: ignore[attr-defined]
except Exception:
pass
@functools.wraps(f)
def sync_wrapper(*args: "Any", **kwargs: "Any") -> "Any":
current_span = get_current_span()
if current_span is None:
logger.debug(
"Cannot create a child span for %s. "
"Please start a Sentry transaction before calling this function.",
qualname_from_function(f),
)
return f(*args, **kwargs)
if isinstance(current_span, StreamedSpan):
warnings.warn(
"Use the @sentry_sdk.traces.trace decorator in span streaming mode.",
DeprecationWarning,
stacklevel=2,
)
return f(*args, **kwargs)
span_op = op or _get_span_op(template)
function_name = name or qualname_from_function(f) or ""
span_name = _get_span_name(template, function_name, kwargs)
send_pii = should_send_default_pii()
with current_span.start_child(
op=span_op,
name=span_name,
) as span:
span.update_data(attributes or {})
_set_input_attributes(
span, template, send_pii, function_name, f, args, kwargs
)
result = f(*args, **kwargs)
_set_output_attributes(span, template, send_pii, result)
return result
try:
sync_wrapper.__signature__ = inspect.signature(f) # type: ignore[attr-defined]
except Exception:
pass
if inspect.iscoroutinefunction(f):
return async_wrapper
else:
return sync_wrapper
return span_decorator
def create_streaming_span_decorator(
name: "Optional[str]" = None,
attributes: "Optional[dict[str, Any]]" = None,
active: bool = True,
) -> "Any":
"""
Create a span creating decorator that can wrap both sync and async functions.
"""
def span_decorator(f: "Any") -> "Any":
"""
Decorator to create a span for the given function.
"""
@functools.wraps(f)
async def async_wrapper(*args: "Any", **kwargs: "Any") -> "Any":
client = sentry_sdk.get_client()
if client.is_active() and not has_span_streaming_enabled(client.options):
warnings.warn(
"Using span streaming API in non-span-streaming mode. Use "
"@sentry_sdk.trace instead.",
stacklevel=2,
)
span_name = name or qualname_from_function(f) or ""
with start_streaming_span(
name=span_name, attributes=attributes, active=active
):
result = await f(*args, **kwargs)
return result
try:
async_wrapper.__signature__ = inspect.signature(f) # type: ignore[attr-defined]
except Exception:
pass
@functools.wraps(f)
def sync_wrapper(*args: "Any", **kwargs: "Any") -> "Any":
client = sentry_sdk.get_client()
if client.is_active() and not has_span_streaming_enabled(client.options):
warnings.warn(
"Using span streaming API in non-span-streaming mode. Use "
"@sentry_sdk.trace instead.",
stacklevel=2,
)
span_name = name or qualname_from_function(f) or ""
with start_streaming_span(
name=span_name, attributes=attributes, active=active
):
return f(*args, **kwargs)
try:
sync_wrapper.__signature__ = inspect.signature(f) # type: ignore[attr-defined]
except Exception:
pass
if inspect.iscoroutinefunction(f):
return async_wrapper
else:
return sync_wrapper
return span_decorator
def get_current_span(
scope: "Optional[sentry_sdk.Scope]" = None,
) -> "Optional[Span]":
"""
Returns the currently active span if there is one running, otherwise `None`
"""
scope = scope or sentry_sdk.get_current_scope()
current_span = scope.span
return current_span
def _generate_sample_rand(
trace_id: "Optional[str]",
*,
interval: "tuple[float, float]" = (0.0, 1.0),
) -> float:
"""Generate a sample_rand value from a trace ID.
The generated value will be pseudorandomly chosen from the provided
interval. Specifically, given (lower, upper) = interval, the generated
value will be in the range [lower, upper). The value has 6-digit precision,
so when printing with .6f, the value will never be rounded up.
The pseudorandom number generator is seeded with the trace ID.
"""
lower, upper = interval
if not lower < upper: # using `if lower >= upper` would handle NaNs incorrectly
raise ValueError("Invalid interval: lower must be less than upper")
rng = Random(trace_id)
lower_scaled = int(lower * 1_000_000)
upper_scaled = int(upper * 1_000_000)
try:
sample_rand_scaled = rng.randrange(lower_scaled, upper_scaled)
except ValueError:
# In some corner cases it might happen that the range is too small
# In that case, just take the lower bound
sample_rand_scaled = lower_scaled
return sample_rand_scaled / 1_000_000
def _sample_rand_range(
parent_sampled: "Optional[bool]", sample_rate: "Optional[float]"
) -> "tuple[float, float]":
"""
Compute the lower (inclusive) and upper (exclusive) bounds of the range of values
that a generated sample_rand value must fall into, given the parent_sampled and
sample_rate values.
"""
if parent_sampled is None or sample_rate is None:
return 0.0, 1.0
elif parent_sampled is True:
return 0.0, sample_rate
else: # parent_sampled is False
return sample_rate, 1.0
def _get_value(source: "Any", key: str) -> "Optional[Any]":
"""
Gets a value from a source object. The source can be a dict or an object.
It is checked for dictionary keys and object attributes.
"""
value = None
if isinstance(source, dict):
value = source.get(key)
else:
if hasattr(source, key):
try:
value = getattr(source, key)
except Exception:
value = None
return value
def _get_span_name(
template: "Union[str, SPANTEMPLATE]",
name: str,
kwargs: "Optional[dict[str, Any]]" = None,
) -> str:
"""
Get the name of the span based on the template and the name.
"""
span_name = name
if template == SPANTEMPLATE.AI_CHAT:
model = None
if kwargs:
for key in ("model", "model_name"):
if kwargs.get(key) and isinstance(kwargs[key], str):
model = kwargs[key]
break
span_name = f"chat {model}" if model else "chat"
elif template == SPANTEMPLATE.AI_AGENT:
span_name = f"invoke_agent {name}"
elif template == SPANTEMPLATE.AI_TOOL:
span_name = f"execute_tool {name}"
return span_name
def _get_span_op(template: "Union[str, SPANTEMPLATE]") -> str:
"""
Get the operation of the span based on the template.
"""
mapping: "dict[Union[str, SPANTEMPLATE], Union[str, OP]]" = {
SPANTEMPLATE.AI_CHAT: OP.GEN_AI_CHAT,
SPANTEMPLATE.AI_AGENT: OP.GEN_AI_INVOKE_AGENT,
SPANTEMPLATE.AI_TOOL: OP.GEN_AI_EXECUTE_TOOL,
}
op = mapping.get(template, OP.FUNCTION)
return str(op)
def _get_input_attributes(
template: "Union[str, SPANTEMPLATE]",
send_pii: bool,
args: "tuple[Any, ...]",
kwargs: "dict[str, Any]",
) -> "dict[str, Any]":
"""
Get input attributes for the given span template.
"""
attributes: "dict[str, Any]" = {}
if template in [SPANTEMPLATE.AI_AGENT, SPANTEMPLATE.AI_TOOL, SPANTEMPLATE.AI_CHAT]:
mapping = {
"model": (SPANDATA.GEN_AI_REQUEST_MODEL, str),
"model_name": (SPANDATA.GEN_AI_REQUEST_MODEL, str),
"agent": (SPANDATA.GEN_AI_AGENT_NAME, str),
"agent_name": (SPANDATA.GEN_AI_AGENT_NAME, str),
"max_tokens": (SPANDATA.GEN_AI_REQUEST_MAX_TOKENS, int),
"frequency_penalty": (SPANDATA.GEN_AI_REQUEST_FREQUENCY_PENALTY, float),
"presence_penalty": (SPANDATA.GEN_AI_REQUEST_PRESENCE_PENALTY, float),
"temperature": (SPANDATA.GEN_AI_REQUEST_TEMPERATURE, float),
"top_p": (SPANDATA.GEN_AI_REQUEST_TOP_P, float),
"top_k": (SPANDATA.GEN_AI_REQUEST_TOP_K, int),
}
def _set_from_key(key: str, value: "Any") -> None:
if key in mapping:
(attribute, data_type) = mapping[key]
if value is not None and isinstance(value, data_type):
attributes[attribute] = value
for key, value in list(kwargs.items()):
if key == "prompt" and isinstance(value, str):
attributes.setdefault(SPANDATA.GEN_AI_REQUEST_MESSAGES, []).append(
{"role": "user", "content": value}
)
continue
if key == "system_prompt" and isinstance(value, str):
attributes.setdefault(SPANDATA.GEN_AI_REQUEST_MESSAGES, []).append(
{"role": "system", "content": value}
)
continue
_set_from_key(key, value)
if template == SPANTEMPLATE.AI_TOOL and send_pii:
attributes[SPANDATA.GEN_AI_TOOL_INPUT] = safe_repr(
{"args": args, "kwargs": kwargs}
)
# Coerce to string
if SPANDATA.GEN_AI_REQUEST_MESSAGES in attributes:
attributes[SPANDATA.GEN_AI_REQUEST_MESSAGES] = safe_repr(
attributes[SPANDATA.GEN_AI_REQUEST_MESSAGES]
)
return attributes
def _get_usage_attributes(usage: "Any") -> "dict[str, Any]":
"""
Get usage attributes.
"""
attributes = {}
def _set_from_keys(attribute: str, keys: "tuple[str, ...]") -> None:
for key in keys:
value = _get_value(usage, key)
if value is not None and isinstance(value, int):
attributes[attribute] = value
_set_from_keys(
SPANDATA.GEN_AI_USAGE_INPUT_TOKENS,
("prompt_tokens", "input_tokens"),
)
_set_from_keys(
SPANDATA.GEN_AI_USAGE_OUTPUT_TOKENS,
("completion_tokens", "output_tokens"),
)
_set_from_keys(
SPANDATA.GEN_AI_USAGE_TOTAL_TOKENS,
("total_tokens",),
)
return attributes
def _get_output_attributes(
template: "Union[str, SPANTEMPLATE]", send_pii: bool, result: "Any"
) -> "dict[str, Any]":
"""
Get output attributes for the given span template.
"""
attributes: "dict[str, Any]" = {}
if template in [SPANTEMPLATE.AI_AGENT, SPANTEMPLATE.AI_TOOL, SPANTEMPLATE.AI_CHAT]:
with capture_internal_exceptions():
# Usage from result, result.usage, and result.metadata.usage
usage_candidates = [result]
usage = _get_value(result, "usage")
usage_candidates.append(usage)
meta = _get_value(result, "metadata")
usage = _get_value(meta, "usage")
usage_candidates.append(usage)
for usage_candidate in usage_candidates:
if usage_candidate is not None:
attributes.update(_get_usage_attributes(usage_candidate))
# Response model
model_name = _get_value(result, "model")
if model_name is not None and isinstance(model_name, str):
attributes[SPANDATA.GEN_AI_RESPONSE_MODEL] = model_name
model_name = _get_value(result, "model_name")
if model_name is not None and isinstance(model_name, str):
attributes[SPANDATA.GEN_AI_RESPONSE_MODEL] = model_name
# Tool output
if template == SPANTEMPLATE.AI_TOOL and send_pii:
attributes[SPANDATA.GEN_AI_TOOL_OUTPUT] = safe_repr(result)
return attributes
def _set_input_attributes(
span: "Span",
template: "Union[str, SPANTEMPLATE]",
send_pii: bool,
name: str,
f: "Any",
args: "tuple[Any, ...]",
kwargs: "dict[str, Any]",
) -> None:
"""
Set span input attributes based on the given span template.
:param span: The span to set attributes on.
:param template: The template to use to set attributes on the span.
:param send_pii: Whether to send PII data.
:param f: The wrapped function.
:param args: The arguments to the wrapped function.
:param kwargs: The keyword arguments to the wrapped function.
"""
attributes: "dict[str, Any]" = {}
if template == SPANTEMPLATE.AI_AGENT:
attributes = {
SPANDATA.GEN_AI_OPERATION_NAME: "invoke_agent",
SPANDATA.GEN_AI_AGENT_NAME: name,
}
elif template == SPANTEMPLATE.AI_CHAT:
attributes = {
SPANDATA.GEN_AI_OPERATION_NAME: "chat",
}
elif template == SPANTEMPLATE.AI_TOOL:
attributes = {
SPANDATA.GEN_AI_OPERATION_NAME: "execute_tool",
SPANDATA.GEN_AI_TOOL_NAME: name,
}
docstring = f.__doc__
if docstring is not None:
attributes[SPANDATA.GEN_AI_TOOL_DESCRIPTION] = docstring
attributes.update(_get_input_attributes(template, send_pii, args, kwargs))
span.update_data(attributes or {})
def _set_output_attributes(
span: "Span", template: "Union[str, SPANTEMPLATE]", send_pii: bool, result: "Any"
) -> None:
"""
Set span output attributes based on the given span template.
:param span: The span to set attributes on.
:param template: The template to use to set attributes on the span.
:param send_pii: Whether to send PII data.
:param result: The result of the wrapped function.
"""
span.update_data(_get_output_attributes(template, send_pii, result) or {})
def _should_continue_trace(baggage: "Optional[Baggage]") -> bool:
"""
Check if we should continue the incoming trace according to the strict_trace_continuation spec.
https://develop.sentry.dev/sdk/telemetry/traces/#stricttracecontinuation
"""
client = sentry_sdk.get_client()
parsed_dsn = client.parsed_dsn
client_org_id = parsed_dsn.org_id if parsed_dsn else None
baggage_org_id = baggage.sentry_items.get("org_id") if baggage else None
if (
client_org_id is not None
and baggage_org_id is not None
and client_org_id != baggage_org_id
):
logger.debug(
f"Starting a new trace because org IDs don't match (incoming baggage org_id: {baggage_org_id}, SDK org_id: {client_org_id})"
)
return False
strict_trace_continuation: bool = client.options.get(
"strict_trace_continuation", False
)
if strict_trace_continuation:
if (baggage_org_id is not None and client_org_id is None) or (
baggage_org_id is None and client_org_id is not None
):
logger.debug(
f"Starting a new trace because strict trace continuation is enabled and one org ID is missing (incoming baggage org_id: {baggage_org_id}, SDK org_id: {client_org_id})"
)
return False
return True
def add_sentry_baggage_to_headers(
headers: "MutableMapping[str, str]", sentry_baggage: str
) -> None:
"""Add the Sentry baggage to the headers.
This function directly mutates the provided headers. The provided sentry_baggage
is appended to the existing baggage. If the baggage already contains Sentry items,
they are stripped out first.
"""
existing_baggage = headers.get(BAGGAGE_HEADER_NAME, "")
stripped_existing_baggage = Baggage.strip_sentry_baggage(existing_baggage)
separator = "," if len(stripped_existing_baggage) > 0 else ""
headers[BAGGAGE_HEADER_NAME] = (
stripped_existing_baggage + separator + sentry_baggage
)
def _make_sampling_decision(
name: str,
attributes: "Optional[Attributes]",
scope: "sentry_sdk.Scope",
) -> "tuple[bool, Optional[float], Optional[float], Optional[str]]":
"""
Decide whether a span should be sampled.
Returns a tuple with:
1. the sampling decision
2. the effective sample rate
3. the sample rand
4. the reason for not sampling the span, if unsampled
"""
client = sentry_sdk.get_client()
if not has_tracing_enabled(client.options):
return False, None, None, None
propagation_context = scope.get_active_propagation_context()
sample_rand = None
if propagation_context.baggage is not None:
sample_rand = propagation_context.baggage._sample_rand()
if sample_rand is None:
sample_rand = _generate_sample_rand(propagation_context.trace_id)
# If there's a traces_sampler, use that; otherwise use traces_sample_rate
traces_sampler_defined = callable(client.options.get("traces_sampler"))
if traces_sampler_defined:
sampling_context = {
"span_context": {
"name": name,
"trace_id": propagation_context.trace_id,
"parent_span_id": propagation_context.parent_span_id,
"parent_sampled": propagation_context.parent_sampled,
"attributes": dict(attributes) if attributes else {},
},
}
if propagation_context.custom_sampling_context:
sampling_context.update(propagation_context.custom_sampling_context)
sample_rate = client.options["traces_sampler"](sampling_context)
else:
if propagation_context.parent_sampled is not None:
sample_rate = propagation_context.parent_sampled
else:
sample_rate = client.options["traces_sample_rate"]
# Validate whether the sample_rate we got is actually valid. Since
# traces_sampler is user-provided, it could return anything.
if not is_valid_sample_rate(sample_rate, source="Tracing"):
logger.warning(f"[Tracing] Discarding {name} because of invalid sample rate.")
return False, None, None, "sample_rate"
sample_rate = float(sample_rate)
if not sample_rate:
if traces_sampler_defined:
reason = "traces_sampler returned 0 or False"
else:
reason = "traces_sample_rate is set to 0"
logger.debug(f"[Tracing] Discarding {name} because {reason}")
return False, 0.0, None, "sample_rate"
# Adjust sample rate if we're under backpressure
sample_rate_before_backpressure = sample_rate
if client.monitor:
sample_rate /= 2**client.monitor.downsample_factor
if not sample_rate:
logger.debug(f"[Tracing] Discarding {name} because backpressure")
return False, 0.0, None, "backpressure"
# Make the actual decision
sampled = sample_rand < sample_rate
if sampled:
logger.debug(f"[Tracing] Starting {name}")
outcome = None
else:
# Determine why exactly the span will not be sampled. If we've lowered
# the effective sample_rate because of backpressure, check whether the
# span would've been sampled if backpressure wasn't active. If that's the
# case, backpressure is the actual reason, otherwise just pure sampling
# rate.
if (
sample_rate_before_backpressure != sample_rate
and sample_rand < sample_rate_before_backpressure
):
logger.debug(f"[Tracing] Discarding {name} because backpressure")
outcome = "backpressure"
else:
logger.debug(
f"[Tracing] Discarding {name} because it's not included in the random sample (sampling rate = {sample_rate})"
)
outcome = "sample_rate"
return sampled, sample_rate, sample_rand, outcome
def is_ignored_span(name: str, attributes: "Optional[Attributes]") -> bool:
"""Determine if a span fits one of the rules in ignore_spans."""
client = sentry_sdk.get_client()
ignore_spans = (client.options.get("_experiments") or {}).get("ignore_spans")
if not ignore_spans:
return False
def _matches(rule: "Any", value: "Any") -> bool:
if isinstance(rule, Pattern):
if isinstance(value, str):
return bool(rule.fullmatch(value))
else:
return False
return rule == value
for rule in ignore_spans:
if isinstance(rule, (str, Pattern)):
if _matches(rule, name):
return True
elif isinstance(rule, dict) and ("name" in rule or "attributes" in rule):
name_matches = True
attributes_match = True
if "name" in rule:
name_matches = _matches(rule["name"], name)
if "attributes" in rule:
attributes = attributes or {}
for attribute, value in rule["attributes"].items():
if attribute not in attributes or not _matches(
value, attributes[attribute]
):
attributes_match = False
break
if name_matches and attributes_match:
return True
return False
# Circular imports
from sentry_sdk.traces import (
LOW_QUALITY_SEGMENT_SOURCES,
StreamedSpan,
)
from sentry_sdk.traces import (
start_span as start_streaming_span,
)
from sentry_sdk.tracing import (
BAGGAGE_HEADER_NAME,
LOW_QUALITY_TRANSACTION_SOURCES,
SENTRY_TRACE_HEADER_NAME,
Span,
)
if TYPE_CHECKING:
from sentry_sdk.tracing import Span
Directory Contents
Dirs: 5 × Files: 36