
Commit 0f74274
Commit message: WIP
1 parent: f4328bb
20 files changed: 1171 additions, 844 deletions

distributed/http/tests/test_core.py

Lines changed: 5 additions & 1 deletion
@@ -7,7 +7,7 @@
 
 from distributed import Semaphore
 from distributed.utils_test import fetch_metrics_sample_names, gen_cluster, inc
-
+from distributed.metrics import context_meter
 
 @gen_cluster(client=True)
 async def test_scheduler(c, s, a, b):

@@ -26,6 +26,10 @@ async def test_prometheus_api_doc(c, s, a):
     # Some metrics only appear if there are tasks on the cluster
     fut = c.submit(inc, 1)
     await fut
+
+    with context_meter.no_threshold():
+        a.data.evict()
+
     # Semaphore metrics only appear after semaphores are used
     sem = await Semaphore()
     await sem.acquire()
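The no_threshold() guard above is needed because ContextMeter.meter (added to distributed/metrics.py in this commit) silently drops deltas below its 1 ms default threshold, and evicting a single tiny key in a test can easily finish faster than that. A minimal sketch of that behaviour, using only the API added by this commit; the "noop" label and the recording callback are illustrative, not part of the change:

    from distributed.metrics import context_meter

    seen = []

    def record(label, value, unit):
        # Same signature as ContextMeter.digest_metric(label, value, unit)
        seen.append((label, value, unit))

    with context_meter.add_callback(record):
        # Finishes well under 1 ms on any normal machine, so with the default
        # threshold nothing is digested.
        with context_meter.meter("noop"):
            pass
        assert seen == []

        # With the threshold disabled, even a near-zero delta reaches the callback.
        with context_meter.no_threshold():
            with context_meter.meter("noop"):
                pass
        assert seen and seen[0][0] == "noop" and seen[0][2] == "seconds"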

distributed/http/worker/prometheus/core.py

Lines changed: 25 additions & 64 deletions
@@ -152,44 +152,11 @@ def collect(self) -> Iterator[Metric]:
             unit="seconds",
             value=max_tick_duration,
         )
-
         yield CounterMetricFamily(
             self.build_name("tick_count"),
             "Total number of ticks observed since the server started",
             value=self.server._tick_counter,
         )
-
-        # This duplicates spill_time_total; however the breakdown is different
-        evloop_blocked_total = CounterMetricFamily(
-            self.build_name("event_loop_blocked_time"),
-            "Total time during which the worker's event loop was blocked "
-            "by spill/unspill activity since the latest worker reset",
-            unit="seconds",
-            labels=["cause"],
-        )
-        # This is typically higher than spill_time_per_key_max, as multiple keys can be
-        # spilled/unspilled without yielding the event loop
-        evloop_blocked_max = GaugeMetricFamily(
-            self.build_name("event_loop_blocked_time_max"),
-            "Maximum contiguous time during which the worker's event loop was blocked "
-            "by spill/unspill activity since the previous Prometheus poll",
-            unit="seconds",
-            labels=["cause"],
-        )
-        for family, digest in (
-            (evloop_blocked_total, self.server.digests_total),
-            (evloop_blocked_max, self.server.digests_max),
-        ):
-            for family_label, digest_label in (
-                ("disk-write-target", "disk-write-target-duration"),
-                ("disk-write-spill", "disk-write-spill-duration"),
-                ("disk-read-execute", "disk-load-duration"),
-                ("disk-read-get-data", "get-data-load-duration"),
-            ):
-                family.add_metric([family_label], digest[digest_label])
-
-        yield evloop_blocked_total
-        yield evloop_blocked_max
         self.server.digests_max.clear()
 
     def collect_crick(self) -> Iterator[Metric]:
@@ -243,42 +210,36 @@ def collect_spillbuffer(self) -> Iterator[Metric]:
             read = spill_bytes.disk_read / spill_time.disk_read
         """
         try:
-            get_metrics = self.server.data.get_metrics  # type: ignore
+            metrics = self.server.data.cumulative_metrics  # type: ignore
         except AttributeError:
             return  # spilling is disabled
-        metrics = get_metrics()
 
-        total_bytes = CounterMetricFamily(
-            self.build_name("spill_bytes"),
-            "Total size of memory and disk accesses caused by managed data "
-            "since the latest worker restart",
-            labels=["activity"],
-        )
-        # Note: memory_read is used to calculate cache hit ratios (see docstring)
-        for k in ("memory_read", "disk_read", "disk_write"):
-            total_bytes.add_metric([k], metrics[f"{k}_bytes_total"])
-        yield total_bytes
-
-        total_counts = CounterMetricFamily(
-            self.build_name("spill_count"),
-            "Total number of memory and disk accesses caused by managed data "
-            "since the latest worker restart",
-            labels=["activity"],
-        )
+        counters = {
+            "bytes": CounterMetricFamily(
+                self.build_name("spill_bytes"),
+                "Total size of memory and disk accesses caused by managed data "
+                "since the latest worker restart",
+                labels=["activity"],
+            ),
+            "count": CounterMetricFamily(
+                self.build_name("spill_count"),
+                "Total number of memory and disk accesses caused by managed data "
+                "since the latest worker restart",
+                labels=["activity"],
+            ),
+            "seconds": CounterMetricFamily(
+                self.build_name("spill_time"),
+                "Total time spent spilling/unspilling since the latest worker restart",
+                unit="seconds",
+                labels=["activity"],
+            ),
+        }
+
         # Note: memory_read is used to calculate cache hit ratios (see docstring)
-        for k in ("memory_read", "disk_read", "disk_write"):
-            total_counts.add_metric([k], metrics[f"{k}_count_total"])
-        yield total_counts
+        for (label, unit), value in metrics.items():
+            counters[unit].add_metric([label], value)
 
-        total_times = CounterMetricFamily(
-            self.build_name("spill_time"),
-            "Total time spent spilling/unspilling since the latest worker restart",
-            unit="seconds",
-            labels=["activity"],
-        )
-        for k in ("pickle", "disk_write", "disk_read", "unpickle"):
-            total_times.add_metric([k], metrics[f"{k}_time_total"])
-        yield total_times
+        yield from counters.values()
 
 
 class PrometheusHandler(RequestHandler):
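The rewritten collect_spillbuffer assumes the spill buffer now exposes a cumulative_metrics mapping keyed by (label, unit) pairs, with one Prometheus counter family per unit; the actual labels and units are produced by the spill buffer elsewhere in this commit and are not visible in this diff. A rough standalone sketch of the routing, with hypothetical sample keys and values:

    from prometheus_client.core import CounterMetricFamily

    # Hypothetical snapshot of what self.server.data.cumulative_metrics might hold;
    # the real keys are defined by the spill buffer, not by this collector.
    cumulative_metrics = {
        ("memory-read", "bytes"): 1_024.0,
        ("memory-read", "count"): 3.0,
        ("disk-write", "bytes"): 2_048.0,
        ("disk-write", "count"): 2.0,
        ("disk-write", "seconds"): 0.015,
    }

    counters = {
        "bytes": CounterMetricFamily(
            "dask_worker_spill_bytes", "Bytes moved by spilling", labels=["activity"]
        ),
        "count": CounterMetricFamily(
            "dask_worker_spill_count", "Accesses caused by spilling", labels=["activity"]
        ),
        "seconds": CounterMetricFamily(
            "dask_worker_spill_time",
            "Time spent spilling",
            unit="seconds",
            labels=["activity"],
        ),
    }

    # Same routing as the new collect_spillbuffer(): the unit picks the counter
    # family, the label becomes the "activity" label of one sample.
    for (label, unit), value in cumulative_metrics.items():
        counters[unit].add_metric([label], value)

    for family in counters.values():
        for sample in family.samples:
            print(sample.name, sample.labels, sample.value)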

distributed/http/worker/tests/test_worker_http.py

Lines changed: 4 additions & 36 deletions
@@ -7,6 +7,7 @@
 from tornado.httpclient import AsyncHTTPClient
 
 from distributed import Event, Worker, wait
+from distributed.metrics import context_meter
 from distributed.sizeof import sizeof
 from distributed.utils_test import (
     async_wait_for,

@@ -25,13 +26,14 @@ async def test_prometheus(c, s, a):
     fut = c.submit(lambda: 1)
     await wait(fut)
 
+    with context_meter.no_threshold():
+        a.data.evict()
+
     active_metrics = await fetch_metrics_sample_names(
         a.http_server.port, prefix="dask_worker_"
     )
     expected_metrics = {
         "dask_worker_concurrent_fetch_requests",
-        "dask_worker_event_loop_blocked_time_max_seconds",
-        "dask_worker_event_loop_blocked_time_seconds_total",
         "dask_worker_latency_seconds",
         "dask_worker_memory_bytes",
         "dask_worker_spill_bytes_total",

@@ -247,37 +249,3 @@ def __sizeof__(self):
     assert 50 * 2**20 < metrics["managed"] < 100 * 2**30  # capped to process memory
     assert metrics["unmanaged"] == 0  # floored to 0
     assert metrics["spilled"] == 0
-
-
-@gen_cluster(
-    client=True,
-    nthreads=[("127.0.0.1", 1)],
-    worker_kwargs={"memory_limit": "10 MiB"},
-    config={
-        "distributed.worker.memory.target": 1.0,
-        "distributed.worker.memory.spill": False,
-        "distributed.worker.memory.pause": False,
-    },
-)
-async def test_prometheus_resets_max_metrics(c, s, a):
-    pytest.importorskip("prometheus_client")
-    np = pytest.importorskip("numpy")
-
-    # The first GET to /metrics calls collect() twice
-    await fetch_metrics(a.http_server.port)
-
-    # We need substantial data to be sure that spilling it will take more than 5ms.
-    x = c.submit(lambda: "x" * 40_000_000, key="x", workers=[a.address])
-    await wait(x)
-    # Key is individually larger than target threshold, so it was spilled immediately
-    assert "x" in a.data.slow
-
-    nsecs = a.digests_max["disk-write-target-duration"]
-    assert nsecs > 0
-
-    families = await fetch_metrics(a.http_server.port)
-    metric = families["dask_worker_event_loop_blocked_time_max_seconds"]
-    samples = {sample.labels["cause"]: sample.value for sample in metric.samples}
-
-    assert samples["disk-write-target"] == nsecs
-    assert a.digests_max["disk-write-target-duration"] == 0
distributed/metrics.py

Lines changed: 174 additions & 1 deletion
@@ -2,8 +2,13 @@
 
 import collections
 import time as timemod
-from collections.abc import Callable
+from collections.abc import Callable, Iterator
+from contextlib import contextmanager
+from contextvars import ContextVar
+from dataclasses import dataclass
 from functools import wraps
+from math import nan
+from typing import Literal
 
 import psutil
 
@@ -103,3 +108,171 @@ def resync(self) -> None:
     thread_time = timemod.thread_time
 except (AttributeError, OSError):  # pragma: no cover
     thread_time = process_time
+
+
+@dataclass
+class MeterOutput:
+    start: float
+    stop: float
+    delta: float
+    __slots__ = tuple(__annotations__)
+
+
+@contextmanager
+def meter(
+    func: Callable[[], float] = timemod.perf_counter,
+    floor: float | Literal[False] = 0.0,
+) -> Iterator[MeterOutput]:
+    """Convenience context manager which calls func() before and after the wrapped
+    code and calculates the delta.
+
+    Parameters
+    ----------
+    func: callable
+        function to call before and after, which must return a number.
+        Besides time, it could return e.g. cumulative network traffic or disk usage.
+        Default: :func:`timemod.perf_counter`
+    floor: float or False, optional
+        Floor the delta to the given value (default: 0). This is useful for strictly
+        cumulative functions that can occasionally glitch and go backwards.
+        Set to False to disable.
+    """
+    out = MeterOutput(func(), nan, nan)
+    try:
+        yield out
+    finally:
+        out.stop = func()
+        out.delta = out.stop - out.start
+        if floor is not False:
+            out.delta = max(floor, out.delta)
+
+
+class ContextMeter:
+    """Context-based general purpose meter.
+
+    Usage
+    -----
+    1. In high-level code, call :meth:`add_callback` to install a hook that defines an
+       activity.
+    2. In low-level code, typically many stack levels below, log quantitative events
+       (e.g. elapsed time, transferred bytes, etc.) so that they will be attributed to
+       the high-level code calling it, either with :meth:`meter` or
+       :meth:`digest_metric`.
+
+    Examples
+    --------
+    In the code that e.g. sends a Python object from A to B over the network:
+    >>> from distributed.metrics import context_meter
+    >>> with context_meter.add_callback(partial(print, "A->B comms:")):
+    ...     await send_over_the_network(obj)
+
+    In the serialization utilities, called many stack levels below:
+    >>> with context_meter.meter("dumps"):
+    ...     pik = pickle.dumps(obj)
+    >>> with context_meter.meter("compress"):
+    ...     pik = lz4.compress(pik)
+
+    And finally, elsewhere, deep into the TCP stack:
+    >>> with context_meter.meter("network-write"):
+    ...     await comm.write(frames)
+
+    When you call the top-level code, you'll get::
+        A->B comms: dumps 0.012 seconds
+        A->B comms: compress 0.034 seconds
+        A->B comms: network-write 0.567 seconds
+    """
+
+    _callbacks: ContextVar[list[Callable[[str, float, str], None]]]
+    default_threshold: float
+
+    def __init__(self):
+        self._callbacks = ContextVar(f"MetricHook<{id(self)}>._callbacks", default=[])
+        self.default_threshold = 0.001
+
+    @contextmanager
+    def add_callback(
+        self, callback: Callable[[str, float, str], None]
+    ) -> Iterator[None]:
+        """Add a callback when entering the context and remove it when exiting it.
+        The callback must accept the same parameters as :meth:`digest_metric`.
+        """
+        cbs = self._callbacks.get()
+        tok = self._callbacks.set(cbs + [callback])
+        try:
+            yield
+        finally:
+            tok.var.reset(tok)
+
+    def digest_metric(self, label: str, value: float, unit: str) -> None:
+        """Invoke the currently set context callbacks for an arbitrary quantitative
+        metric.
+        """
+        cbs = self._callbacks.get()
+        for cb in cbs:
+            cb(label, value, unit)
+
+    @contextmanager
+    def meter(
+        self,
+        label: str,
+        unit: str = "seconds",
+        func: Callable[[], float] = timemod.perf_counter,
+        floor: float | Literal[False] = 0.0,
+        threshold: float | None = None,
+    ) -> Iterator[None]:
+        """Convenience context manager which calls func() before and after the wrapped
+        code, calculates the delta, and finally calls :meth:`digest_metric`. It also
+        subtracts any other calls to :meth:`meter` or :meth:`digest_metric` with the
+        same unit performed within the context, so that the total is strictly additive.
+
+        :meth:`digest_metric` is not called in case of exception.
+
+        Parameters
+        ----------
+        label: str
+            label to pass to the callback
+        unit: str, optional
+            unit to pass to the callback. Default: seconds
+        func: callable
+            see :func:`meter`
+        floor: float or False, optional
+            see :func:`meter`
+        threshold: float, optional
+            Do not call :meth:`digest_metric` if the delta is less than this.
+            Default: 1ms
+        """
+        offsets = []
+
+        def cb(label2: str, value2: float, unit2: str) -> None:
+            if unit2 == unit:
+                # This must be threadsafe to support when callbacks are invoked from
+                # distributed.utils.offload; '+=' on a float would not be threadsafe!
+                offsets.append(value2)
+
+        with self.add_callback(cb), meter(func, floor=False) as m:
+            yield
+
+        delta = m.delta - sum(offsets)
+        if floor is not False:
+            delta = max(floor, delta)
+        if threshold is None:
+            threshold = self.default_threshold
+        if delta >= threshold:
+            self.digest_metric(label, delta, unit)
+
+    @contextmanager
+    def no_threshold(self) -> Iterator[None]:
+        """Temporarily disable the default threshold in :meth:`meter`.
+        Useful for unit testing trivial timings.
+        """
+        bak = self.default_threshold
+        self.default_threshold = 0.0
+        try:
+            yield
+        finally:
+            self.default_threshold = bak
+
+
+context_meter = ContextMeter()
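The key property of ContextMeter.meter is that nested measurements with the same unit are subtracted from the enclosing one (via the offsets list), so the digested totals stay strictly additive. A small self-contained demonstration of that behaviour; the labels, the sleep durations, and the print callback are arbitrary illustrations, not part of the commit:

    import time

    from distributed.metrics import context_meter

    def report(label, value, unit):
        print(f"{label}: {value:.3f} {unit}")

    with context_meter.add_callback(report):
        with context_meter.meter("total"):
            with context_meter.meter("serialize"):
                time.sleep(0.1)  # attributed to "serialize"
            time.sleep(0.05)  # the remainder is attributed to "total"

    # Expected output (approximately):
    #   serialize: 0.100 seconds
    #   total: 0.050 seconds   (0.15 s outer delta minus the 0.1 s already digested)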
