Skip to content

Cleanup op and description mapping #4560

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 1 commit into
base: potel-base
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 0 additions & 2 deletions sentry_sdk/_types.py
Original file line number Diff line number Diff line change
Expand Up @@ -262,5 +262,3 @@ class SDKInfo(TypedDict):
)

HttpStatusCodeRange = Union[int, Container[int]]

OtelExtractedSpanData = tuple[str, str, Optional[str], Optional[int], Optional[str]]
2 changes: 2 additions & 0 deletions sentry_sdk/consts.py
Original file line number Diff line number Diff line change
Expand Up @@ -674,6 +674,7 @@ class OP:
HTTP_CLIENT = "http.client"
HTTP_CLIENT_STREAM = "http.client.stream"
HTTP_SERVER = "http.server"
MESSAGE = "message"
MIDDLEWARE_DJANGO = "middleware.django"
MIDDLEWARE_LITESTAR = "middleware.litestar"
MIDDLEWARE_LITESTAR_RECEIVE = "middleware.litestar.receive"
Expand Down Expand Up @@ -705,6 +706,7 @@ class OP:
QUEUE_TASK_HUEY = "queue.task.huey"
QUEUE_SUBMIT_RAY = "queue.submit.ray"
QUEUE_TASK_RAY = "queue.task.ray"
RPC = "rpc"
SUBPROCESS = "subprocess"
SUBPROCESS_WAIT = "subprocess.wait"
SUBPROCESS_COMMUNICATE = "subprocess.communicate"
Expand Down
20 changes: 10 additions & 10 deletions sentry_sdk/opentelemetry/span_processor.py
Original file line number Diff line number Diff line change
Expand Up @@ -219,18 +219,16 @@ def _root_span_to_transaction_event(self, span: ReadableSpan) -> Optional[Event]
if profile_context:
contexts["profile"] = profile_context

(_, description, _, http_status, _) = span_data

if http_status:
contexts["response"] = {"status_code": http_status}
if span_data.http_status:
contexts["response"] = {"status_code": span_data.http_status}

if span.resource.attributes:
contexts[OTEL_SENTRY_CONTEXT] = {"resource": dict(span.resource.attributes)}

event.update(
{
"type": "transaction",
"transaction": transaction_name or description,
"transaction": transaction_name or span_data.description,
"transaction_info": {"source": transaction_source or "custom"},
"contexts": contexts,
}
Expand All @@ -257,19 +255,21 @@ def _span_to_json(self, span: ReadableSpan) -> Optional[dict[str, Any]]:
span_id = format_span_id(span.context.span_id)
parent_span_id = format_span_id(span.parent.span_id) if span.parent else None

(op, description, status, _, origin) = extract_span_data(span)
span_data = extract_span_data(span)

span_json.update(
{
"trace_id": trace_id,
"span_id": span_id,
"op": op,
"description": description,
"status": status,
"origin": origin or DEFAULT_SPAN_ORIGIN,
"description": span_data.description,
"origin": span_data.origin or DEFAULT_SPAN_ORIGIN,
}
)

if span_data.op:
span_json["op"] = span_data.op
if span_data.status:
span_json["status"] = span_data.status
if parent_span_id:
span_json["parent_span_id"] = parent_span_id

Expand Down
218 changes: 94 additions & 124 deletions sentry_sdk/opentelemetry/utils.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
from __future__ import annotations
import re
from datetime import datetime, timezone
from dataclasses import dataclass

from urllib3.util import parse_url as urlparse
from urllib.parse import quote, unquote
Expand Down Expand Up @@ -30,8 +31,7 @@
from sentry_sdk._types import TYPE_CHECKING

if TYPE_CHECKING:
from typing import Any, Optional, Mapping, Sequence, Union, Type, TypeVar
from sentry_sdk._types import OtelExtractedSpanData
from typing import Any, Optional, Mapping, Union, Type, TypeVar

T = TypeVar("T")

Expand Down Expand Up @@ -111,115 +111,111 @@ def extract_transaction_name_source(
)


def extract_span_data(span: ReadableSpan) -> OtelExtractedSpanData:
op = span.name
description = span.name
status, http_status = extract_span_status(span)
@dataclass
class ExtractedSpanData:
description: str
op: Optional[str] = None
status: Optional[str] = None
http_status: Optional[int] = None
origin: Optional[str] = None


def extract_span_data(span: ReadableSpan) -> ExtractedSpanData:
"""
Try to populate sane values for op, description and statuses based on what we have.
The op and description mapping is fundamentally janky because otel only has a single `name`.

Priority is given first to attributes explicitly defined by us via the SDK.
Otherwise we try to infer sane values from other attributes.
"""
op = None
description = None
origin = None
if span.attributes is None:
return (op, description, status, http_status, origin)

attribute_op = get_typed_attribute(span.attributes, SentrySpanAttribute.OP, str)
op = attribute_op or op
description = (
get_typed_attribute(span.attributes, SentrySpanAttribute.DESCRIPTION, str)
or description
)
origin = get_typed_attribute(span.attributes, SentrySpanAttribute.ORIGIN, str)

http_method = get_typed_attribute(span.attributes, SpanAttributes.HTTP_METHOD, str)
if http_method:
return span_data_for_http_method(span)

db_query = span.attributes.get(SpanAttributes.DB_SYSTEM)
if db_query:
return span_data_for_db_query(span)

rpc_service = span.attributes.get(SpanAttributes.RPC_SERVICE)
if rpc_service:
return (
attribute_op or "rpc",
description,
status,
http_status,
origin,
)
if span.attributes is not None:
op = get_typed_attribute(
span.attributes, SentrySpanAttribute.OP, str
) or infer_op(span)

messaging_system = span.attributes.get(SpanAttributes.MESSAGING_SYSTEM)
if messaging_system:
return (
attribute_op or "message",
description,
status,
http_status,
origin,
description = (
get_typed_attribute(span.attributes, SentrySpanAttribute.DESCRIPTION, str)
or get_typed_attribute(span.attributes, SentrySpanAttribute.NAME, str)
or infer_description(span)
)

faas_trigger = span.attributes.get(SpanAttributes.FAAS_TRIGGER)
if faas_trigger:
return (str(faas_trigger), description, status, http_status, origin)
origin = get_typed_attribute(span.attributes, SentrySpanAttribute.ORIGIN, str)

return (op, description, status, http_status, origin)
# TODO status cleanup
(status, http_status) = extract_span_status(span)

return ExtractedSpanData(
description=description or span.name,
op=op,
status=status,
http_status=http_status,
origin=origin,
)

def span_data_for_http_method(span: ReadableSpan) -> OtelExtractedSpanData:
span_attributes = span.attributes or {}

op = get_typed_attribute(span_attributes, SentrySpanAttribute.OP, str)
if op is None:
op = "http"
def infer_op(span: ReadableSpan) -> Optional[str]:
"""
Try to infer op for the various types of instrumentation.
"""
if span.attributes is None:
return None

if SpanAttributes.HTTP_METHOD in span.attributes:
op = "http"
if span.kind == SpanKind.SERVER:
op += ".server"
elif span.kind == SpanKind.CLIENT:
op += ".client"
return op
elif SpanAttributes.DB_SYSTEM in span.attributes:
return OP.DB
elif SpanAttributes.RPC_SERVICE in span.attributes:
return OP.RPC
elif SpanAttributes.MESSAGING_SYSTEM in span.attributes:
return OP.MESSAGE
elif SpanAttributes.FAAS_TRIGGER in span.attributes:
return get_typed_attribute(span.attributes, SpanAttributes.FAAS_TRIGGER, str)
else:
return None

http_method = span_attributes.get(SpanAttributes.HTTP_METHOD)
route = span_attributes.get(SpanAttributes.HTTP_ROUTE)
target = span_attributes.get(SpanAttributes.HTTP_TARGET)
peer_name = span_attributes.get(SpanAttributes.NET_PEER_NAME)

# TODO-neel-potel remove description completely
description = get_typed_attribute(
span_attributes, SentrySpanAttribute.DESCRIPTION, str
) or get_typed_attribute(span_attributes, SentrySpanAttribute.NAME, str)
if description is None:
description = f"{http_method}"
def infer_description(span: ReadableSpan) -> Optional[str]:
if span.attributes is None:
return None

if SpanAttributes.HTTP_METHOD in span.attributes:
http_method = get_typed_attribute(
span.attributes, SpanAttributes.HTTP_METHOD, str
)
route = get_typed_attribute(span.attributes, SpanAttributes.HTTP_ROUTE, str)
target = get_typed_attribute(span.attributes, SpanAttributes.HTTP_TARGET, str)
peer_name = get_typed_attribute(
span.attributes, SpanAttributes.NET_PEER_NAME, str
)
url = get_typed_attribute(span.attributes, SpanAttributes.HTTP_URL, str)

if route:
description = f"{http_method} {route}"
return f"{http_method} {route}"
elif target:
description = f"{http_method} {target}"
return f"{http_method} {target}"
elif peer_name:
description = f"{http_method} {peer_name}"
return f"{http_method} {peer_name}"
elif url:
parsed_url = urlparse(url)
url = "{}://{}{}".format(
parsed_url.scheme, parsed_url.netloc, parsed_url.path
)
return f"{http_method} {url}"
else:
url = span_attributes.get(SpanAttributes.HTTP_URL)
url = get_typed_attribute(span_attributes, SpanAttributes.HTTP_URL, str)

if url:
parsed_url = urlparse(url)
url = "{}://{}{}".format(
parsed_url.scheme, parsed_url.netloc, parsed_url.path
)
description = f"{http_method} {url}"

status, http_status = extract_span_status(span)

origin = get_typed_attribute(span_attributes, SentrySpanAttribute.ORIGIN, str)

return (op, description, status, http_status, origin)


def span_data_for_db_query(span: ReadableSpan) -> OtelExtractedSpanData:
span_attributes = span.attributes or {}

op = get_typed_attribute(span_attributes, SentrySpanAttribute.OP, str) or OP.DB
statement = get_typed_attribute(span_attributes, SpanAttributes.DB_STATEMENT, str)

description = statement or span.name
origin = get_typed_attribute(span_attributes, SentrySpanAttribute.ORIGIN, str)

return (op, description, None, None, origin)
return http_method
elif SpanAttributes.DB_SYSTEM in span.attributes:
return get_typed_attribute(span.attributes, SpanAttributes.DB_STATEMENT, str)
else:
return None


def extract_span_status(span: ReadableSpan) -> tuple[Optional[str], Optional[int]]:
Expand Down Expand Up @@ -258,17 +254,7 @@ def extract_span_status(span: ReadableSpan) -> tuple[Optional[str], Optional[int


def infer_status_from_attributes(
span_attributes: Mapping[
str,
str
| bool
| int
| float
| Sequence[str]
| Sequence[bool]
| Sequence[int]
| Sequence[float],
],
span_attributes: Mapping[str, Any],
) -> tuple[Optional[str], Optional[int]]:
http_status = get_http_status_code(span_attributes)

Expand All @@ -282,19 +268,7 @@ def infer_status_from_attributes(
return (None, None)


def get_http_status_code(
span_attributes: Mapping[
str,
str
| bool
| int
| float
| Sequence[str]
| Sequence[bool]
| Sequence[int]
| Sequence[float],
],
) -> Optional[int]:
def get_http_status_code(span_attributes: Mapping[str, Any]) -> Optional[int]:
try:
http_status = get_typed_attribute(
span_attributes, SpanAttributes.HTTP_RESPONSE_STATUS_CODE, int
Expand Down Expand Up @@ -329,7 +303,7 @@ def extract_span_attributes(span: ReadableSpan, namespace: str) -> dict[str, Any


def get_trace_context(
span: ReadableSpan, span_data: Optional[OtelExtractedSpanData] = None
span: ReadableSpan, span_data: Optional[ExtractedSpanData] = None
) -> dict[str, Any]:
if not span.context:
return {}
Expand All @@ -341,27 +315,23 @@ def get_trace_context(
if span_data is None:
span_data = extract_span_data(span)

(op, _, status, _, origin) = span_data

trace_context: dict[str, Any] = {
"trace_id": trace_id,
"span_id": span_id,
"parent_span_id": parent_span_id,
"op": op,
"origin": origin or DEFAULT_SPAN_ORIGIN,
"origin": span_data.origin or DEFAULT_SPAN_ORIGIN,
}

if status:
trace_context["status"] = status

if span_data.op:
trace_context["op"] = span_data.op
if span_data.status:
trace_context["status"] = span_data.status
if span.attributes:
trace_context["data"] = dict(span.attributes)

trace_state = get_trace_state(span)
trace_context["dynamic_sampling_context"] = dsc_from_trace_state(trace_state)

# TODO-neel-potel profiler thread_id, thread_name

return trace_context


Expand Down
2 changes: 1 addition & 1 deletion sentry_sdk/tracing.py
Original file line number Diff line number Diff line change
Expand Up @@ -187,7 +187,7 @@ def __init__(
# OTel timestamps have nanosecond precision
start_timestamp = convert_to_otel_timestamp(start_timestamp)

span_name = name or description or op or DEFAULT_SPAN_NAME
span_name = name or description or DEFAULT_SPAN_NAME

# Prepopulate some attrs so that they're accessible in traces_sampler
attributes = attributes or {}
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
"""
Tests need a local clickhouse instance running, this can best be done using
```sh
docker run -d -p 18123:8123 -p9000:9000 --name clickhouse-test --ulimit nofile=262144:262144 --rm clickhouse
docker run -d -e CLICKHOUSE_SKIP_USER_SETUP=1 -p 8123:8123 -p 9000:9000 --name clickhouse-test --ulimit nofile=262144:262144 --rm clickhouse
```
"""

Expand Down Expand Up @@ -822,7 +822,7 @@ def test_clickhouse_dbapi_spans(sentry_init, capture_events, capture_envelopes)
span.pop("span_id", None)
span.pop("start_timestamp", None)
span.pop("timestamp", None)
span.pop("status")
span.pop("status", None)
Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

these were all None before anyway


assert event["spans"] == expected_spans

Expand Down
Loading
Loading