Skip to content

Truncate long sql queries to prevent oversized events to APM server #842

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 9 commits into from
Jun 4, 2020
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions CHANGELOG.asciidoc
Original file line number Diff line number Diff line change
Expand Up @@ -33,6 +33,10 @@ endif::[]

* Added error handling around frame processing in Django {pull}837[#837]

[float]
===== Bug fixes

* Limit SQL queries in context data to 10000 characters {pull}842[#842]

[[release-notes-5.x]]
=== Python Agent version 5.x
Expand Down
7 changes: 6 additions & 1 deletion elasticapm/instrumentation/packages/dbapi2.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,7 +38,7 @@
from elasticapm.instrumentation.packages.base import AbstractInstrumentedModule
from elasticapm.traces import capture_span
from elasticapm.utils import compat, wrapt
from elasticapm.utils.encoding import force_text
from elasticapm.utils.encoding import force_text, shorten


class Literal(object):
Expand Down Expand Up @@ -225,6 +225,11 @@ def _trace_sql(self, method, sql, params, action=QUERY_ACTION):
signature = sql_string + "()"
else:
signature = self.extract_signature(sql_string)

# Truncate sql_string to 10000 characters to prevent large queries from
# causing an error to APM server.
sql_string = shorten(sql_string, string_length=10000)

with capture_span(
signature,
span_type="db",
Expand Down
4 changes: 3 additions & 1 deletion elasticapm/instrumentation/packages/sqlite.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,7 @@
extract_signature,
)
from elasticapm.traces import capture_span
from elasticapm.utils.encoding import shorten


class SQLiteCursorProxy(CursorProxy):
Expand All @@ -52,12 +53,13 @@ class SQLiteConnectionProxy(ConnectionProxy):

def _trace_sql(self, method, sql, params):
signature = extract_signature(sql)
sql_string = shorten(sql, string_length=10000)
with capture_span(
signature,
span_type="db",
span_subtype="sqlite",
span_action="query",
extra={"db": {"type": "sql", "statement": sql}},
extra={"db": {"type": "sql", "statement": sql_string}},
):
if params is None:
return method(sql)
Expand Down
4 changes: 4 additions & 0 deletions elasticapm/utils/encoding.py
Original file line number Diff line number Diff line change
Expand Up @@ -218,6 +218,10 @@ def shorten(var, list_length=50, string_length=200, dict_length=50):


def keyword_field(string):
"""
If the given string is longer than KEYWORD_MAX_LENGTH, truncate it to
KEYWORD_MAX_LENGTH-1, adding the "…" character at the end.
"""
if not isinstance(string, compat.string_types) or len(string) <= KEYWORD_MAX_LENGTH:
return string
return string[: KEYWORD_MAX_LENGTH - 1] + u"…"
Expand Down
17 changes: 17 additions & 0 deletions tests/instrumentation/sqlite_tests.py
Original file line number Diff line number Diff line change
Expand Up @@ -125,3 +125,20 @@ def test_nonstandard_connection_execute(instrument, elasticapm_client):
assert spans[3]["action"] == "query"

assert len(spans) == 4


def test_truncate_long_sql(instrument, elasticapm_client):
conn = sqlite3.connect(":memory:")

conn.execute("CREATE TABLE testdb (id integer, username text)")
conn.execute('INSERT INTO testdb VALUES (1, "Ron")')
elasticapm_client.begin_transaction("transaction.test")
conn.execute("""SELECT id, username FROM testdb WHERE username = "%s";""" % ("x" * 10010))
elasticapm_client.end_transaction("MyView")
conn.execute("DROP TABLE testdb")

transactions = elasticapm_client.events[TRANSACTION]
spans = elasticapm_client.spans_for_transaction(transactions[0])

assert len(spans[0]["context"]["db"]["statement"]) == 10000
assert spans[0]["context"]["db"]["statement"].endswith("...")