added 2D (normalized) surface dice metric (#4050)

SilviaSeidlitz · web-flow · commit 6602303578cb · 2022-04-10T21:51:00.000+01:00
* added 2D (normalized) surface dice metric

Signed-off-by: Silvia Seidlitz &lt;s.seidlitz@dkfz-heidelberg.de&gt;

* exclude from min tests

Signed-off-by: Wenqi Li &lt;wenqil@nvidia.com&gt;

* more detailled docstring

Signed-off-by: Silvia Seidlitz &lt;s.seidlitz@dkfz-heidelberg.de&gt;
diff --git a/docs/source/metrics.rst b/docs/source/metrics.rst
@@ -69,6 +69,13 @@ Metrics
 .. autoclass:: SurfaceDistanceMetric
     :members:
 
+`Surface dice`
+--------------
+.. autofunction:: compute_surface_dice
+
+.. autoclass:: SurfaceDiceMetric
+    :members:
+
 `Mean squared error`
 --------------------
 .. autoclass:: MSEMetric
diff --git a/monai/metrics/__init__.py b/monai/metrics/__init__.py
@@ -17,5 +17,6 @@
 from .metric import Cumulative, CumulativeIterationMetric, IterationMetric, Metric
 from .regression import MAEMetric, MSEMetric, PSNRMetric, RMSEMetric
 from .rocauc import ROCAUCMetric, compute_roc_auc
+from .surface_dice import SurfaceDiceMetric, compute_surface_dice
 from .surface_distance import SurfaceDistanceMetric, compute_average_surface_distance
 from .utils import do_metric_reduction, get_mask_edges, get_surface_distance, ignore_background
diff --git a/monai/metrics/surface_dice.py b/monai/metrics/surface_dice.py
@@ -0,0 +1,236 @@
+# Copyright (c) MONAI Consortium
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#     http://www.apache.org/licenses/LICENSE-2.0
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import warnings
+from typing import List, Union
+
+import numpy as np
+import torch
+
+from monai.metrics.utils import do_metric_reduction, get_mask_edges, get_surface_distance, ignore_background
+from monai.utils import MetricReduction, convert_data_type
+
+from .metric import CumulativeIterationMetric
+
+
+class SurfaceDiceMetric(CumulativeIterationMetric):
+    """
+    Computes the Normalized Surface Distance (NSD) for each batch sample and class of
+    predicted segmentations `y_pred` and corresponding reference segmentations `y` according to equation :eq:`nsd`.
+    This implementation supports 2D images. For 3D images, please refer to DeepMind's implementation
+    https://github.com/deepmind/surface-distance.
+
+    The class- and batch sample-wise NSD values can be aggregated with the function `aggregate`.
+
+    Args:
+        class_thresholds: List of class-specific thresholds.
+            The thresholds relate to the acceptable amount of deviation in the segmentation boundary in pixels.
+            Each threshold needs to be a finite, non-negative number.
+        include_background: Whether to skip NSD computation on the first channel of the predicted output.
+            Defaults to ``False``.
+        distance_metric: The metric used to compute surface distances.
+            One of [``"euclidean"``, ``"chessboard"``, ``"taxicab"``].
+            Defaults to ``"euclidean"``.
+        reduction: The mode to aggregate metrics.
+            One of [``"mean"``, ``"sum"``, ``"mean_batch"``, ``"sum_batch"``, ``"mean_channel"``, ``"sum_channel"``,
+            ``"none"``].
+            Defaults to ``"mean"``.
+            If ``"none"`` is chosen, no aggregation will be performed.
+            The aggregation will ignore nan values.
+        get_not_nans: whether to return the `not_nans` count.
+            Defaults to ``False``.
+            `not_nans` is the number of batch samples for which not all class-specific NSD values were nan values.
+            If set to ``True``, the function `aggregate` will return both the aggregated NSD and the `not_nans` count.
+            If set to ``False``, `aggregate` will only return the aggregated NSD.
+    """
+
+    def __init__(
+        self,
+        class_thresholds: List[float],
+        include_background: bool = False,
+        distance_metric: str = "euclidean",
+        reduction: Union[MetricReduction, str] = MetricReduction.MEAN,
+        get_not_nans: bool = False,
+    ) -> None:
+        super().__init__()
+        self.class_thresholds = class_thresholds
+        self.include_background = include_background
+        self.distance_metric = distance_metric
+        self.reduction = reduction
+        self.get_not_nans = get_not_nans
+
+    def _compute_tensor(self, y_pred: torch.Tensor, y: torch.Tensor):  # type: ignore
+        r"""
+        Args:
+            y_pred: Predicted segmentation, typically segmentation model output.
+                It must be a one-hot encoded, batch-first tensor [B,C,H,W].
+            y: Reference segmentation.
+                It must be a one-hot encoded, batch-first tensor [B,C,H,W].
+
+        Returns:
+            Pytorch Tensor of shape [B,C], containing the NSD values :math:`\operatorname {NSD}_{b,c}` for each batch
+            index :math:`b` and class :math:`c`.
+        """
+        return compute_surface_dice(
+            y_pred=y_pred,
+            y=y,
+            class_thresholds=self.class_thresholds,
+            include_background=self.include_background,
+            distance_metric=self.distance_metric,
+        )
+
+    def aggregate(self):
+        r"""
+        Aggregates the output of `_compute_tensor`.
+
+        Returns:
+            If `get_not_nans` is set to ``True``, this function returns the aggregated NSD and the `not_nans` count.
+            If `get_not_nans` is set to ``False``, this function returns only the aggregated NSD.
+        """
+        data = self.get_buffer()
+        if not isinstance(data, torch.Tensor):
+            raise ValueError("the data to aggregate must be PyTorch Tensor.")
+
+        # do metric reduction
+        f, not_nans = do_metric_reduction(data, self.reduction)
+        return (f, not_nans) if self.get_not_nans else f
+
+
+def compute_surface_dice(
+    y_pred: torch.Tensor,
+    y: torch.Tensor,
+    class_thresholds: List[float],
+    include_background: bool = False,
+    distance_metric: str = "euclidean",
+):
+    r"""
+    This function computes the (Normalized) Surface Dice (NSD) between the two tensors `y_pred` (referred to as
+    :math:`\hat{Y}`) and `y` (referred to as :math:`Y`). This metric determines which fraction of a segmentation
+    boundary is correctly predicted. A boundary element is considered correctly predicted if the closest distance to the
+    reference boundary is smaller than or equal to the specified threshold related to the acceptable amount of deviation in
+    pixels. The NSD is bounded between 0 and 1.
+
+    This implementation supports multi-class tasks with an individual threshold :math:`\tau_c` for each class :math:`c`.
+    The class-specific NSD for batch index :math:`b`, :math:`\operatorname {NSD}_{b,c}`, is computed using the function:
+
+    .. math::
+        \operatorname {NSD}_{b,c} \left(Y_{b,c}, \hat{Y}_{b,c}\right) = \frac{\left|\mathcal{D}_{Y_{b,c}}^{'}\right| +
+        \left| \mathcal{D}_{\hat{Y}_{b,c}}^{'} \right|}{\left|\mathcal{D}_{Y_{b,c}}\right| +
+        \left|\mathcal{D}_{\hat{Y}_{b,c}}\right|}
+        :label: nsd
+
+    with :math:`\mathcal{D}_{Y_{b,c}}` and :math:`\mathcal{D}_{\hat{Y}_{b,c}}` being two sets of nearest-neighbor
+    distances. :math:`\mathcal{D}_{Y_{b,c}}` is computed from the predicted segmentation boundary towards the reference segmentation
+    boundary and vice-versa for :math:`\mathcal{D}_{\hat{Y}_{b,c}}`. :math:`\mathcal{D}_{Y_{b,c}}^{'}` and
+    :math:`\mathcal{D}_{\hat{Y}_{b,c}}^{'}` refer to the subsets of distances that are smaller or equal to the
+    acceptable distance :math:`\tau_c`:
+
+    .. math::
+        \mathcal{D}_{Y_{b,c}}^{'} = \{ d \in \mathcal{D}_{Y_{b,c}} \, | \, d \leq \tau_c \}.
+
+
+    In the case of a class neither being present in the predicted segmentation, nor in the reference segmentation, a nan value
+    will be returned for this class. In the case of a class being present in only one of predicted segmentation or
+    reference segmentation, the class NSD will be 0.
+
+    This implementation is based on https://arxiv.org/abs/2111.05408 and supports 2D images.
+    Be aware that the computation of boundaries is different from DeepMind's implementation
+    https://github.com/deepmind/surface-distance. In this implementation, the length of a segmentation boundary is
+    interpreted as the number of its edge pixels. In DeepMind's implementation, the length of a segmentation boundary
+    depends on the local neighborhood (cf. https://arxiv.org/abs/1809.04430).
+
+    Args:
+        y_pred: Predicted segmentation, typically segmentation model output.
+            It must be a one-hot encoded, batch-first tensor [B,C,H,W].
+        y: Reference segmentation.
+            It must be a one-hot encoded, batch-first tensor [B,C,H,W].
+        class_thresholds: List of class-specific thresholds.
+            The thresholds relate to the acceptable amount of deviation in the segmentation boundary in pixels.
+            Each threshold needs to be a finite, non-negative number.
+        include_background: Whether to skip the surface dice computation on the first channel of
+            the predicted output. Defaults to ``False``.
+        distance_metric: The metric used to compute surface distances.
+            One of [``"euclidean"``, ``"chessboard"``, ``"taxicab"``].
+            Defaults to ``"euclidean"``.
+
+    Raises:
+        ValueError: If `y_pred` and/or `y` are not PyTorch tensors.
+        ValueError: If `y_pred` and/or `y` do not have four dimensions.
+        ValueError: If `y_pred` and/or `y` have different shapes.
+        ValueError: If `y_pred` and/or `y` are not one-hot encoded
+        ValueError: If the number of channels of `y_pred` and/or `y` is different from the number of class thresholds.
+        ValueError: If any class threshold is not finite.
+        ValueError: If any class threshold is negative.
+
+    Returns:
+        Pytorch Tensor of shape [B,C], containing the NSD values :math:`\operatorname {NSD}_{b,c}` for each batch index
+        :math:`b` and class :math:`c`.
+    """
+
+    if not include_background:
+        y_pred, y = ignore_background(y_pred=y_pred, y=y)
+
+    if not isinstance(y_pred, torch.Tensor) or not isinstance(y, torch.Tensor):
+        raise ValueError("y_pred and y must be PyTorch Tensor.")
+
+    if y_pred.ndimension() != 4 or y.ndimension() != 4:
+        raise ValueError("y_pred and y should have four dimensions: [B,C,H,W].")
+
+    if y_pred.shape != y.shape:
+        raise ValueError(
+            f"y_pred and y should have same shape, but instead, shapes are {y_pred.shape} (y_pred) and {y.shape} (y)."
+        )
+
+    if not torch.all(y_pred.byte() == y_pred) or not torch.all(y.byte() == y):
+        raise ValueError("y_pred and y should be binarized tensors (e.g. torch.int64).")
+    if torch.any(y_pred > 1) or torch.any(y > 1):
+        raise ValueError("y_pred and y should be one-hot encoded.")
+
+    y = y.float()
+    y_pred = y_pred.float()
+
+    batch_size, n_class = y_pred.shape[:2]
+
+    if n_class != len(class_thresholds):
+        raise ValueError(
+            f"number of classes ({n_class}) does not match number of class thresholds ({len(class_thresholds)})."
+        )
+
+    if any(~np.isfinite(class_thresholds)):
+        raise ValueError("All class thresholds need to be finite.")
+
+    if any(np.array(class_thresholds) < 0):
+        raise ValueError("All class thresholds need to be >= 0.")
+
+    nsd = np.empty((batch_size, n_class))
+
+    for b, c in np.ndindex(batch_size, n_class):
+        (edges_pred, edges_gt) = get_mask_edges(y_pred[b, c], y[b, c], crop=False)
+        if not np.any(edges_gt):
+            warnings.warn(f"the ground truth of class {c} is all 0, this may result in nan/inf distance.")
+        if not np.any(edges_pred):
+            warnings.warn(f"the prediction of class {c} is all 0, this may result in nan/inf distance.")
+
+        distances_pred_gt = get_surface_distance(edges_pred, edges_gt, distance_metric=distance_metric)
+        distances_gt_pred = get_surface_distance(edges_gt, edges_pred, distance_metric=distance_metric)
+
+        boundary_complete = len(distances_pred_gt) + len(distances_gt_pred)
+        boundary_correct = np.sum(distances_pred_gt <= class_thresholds[c]) + np.sum(
+            distances_gt_pred <= class_thresholds[c]
+        )
+
+        if boundary_complete == 0:
+            # the class is neither present in the prediction, nor in the reference segmentation
+            nsd[b, c] = np.nan
+        else:
+            nsd[b, c] = boundary_correct / boundary_complete
+
+    return convert_data_type(nsd, torch.Tensor)[0]
diff --git a/tests/min_tests.py b/tests/min_tests.py
@@ -145,6 +145,7 @@ def run_testsuit():
         "test_spacingd",
         "test_splitdimd",
         "test_surface_distance",
+        "test_surface_dice",
         "test_testtimeaugmentation",
         "test_torchvision",
         "test_torchvisiond",
diff --git a/tests/test_surface_dice.py b/tests/test_surface_dice.py