Skip to content

Commit

Permalink
added 2D (normalized) surface dice metric (#4050)
Browse files Browse the repository at this point in the history
* added 2D (normalized) surface dice metric

Signed-off-by: Silvia Seidlitz <[email protected]>

* exclude from min tests

Signed-off-by: Wenqi Li <[email protected]>

* more detailled docstring

Signed-off-by: Silvia Seidlitz <[email protected]>
  • Loading branch information
SilviaSeidlitz authored Apr 10, 2022
1 parent 17529e7 commit 6602303
Show file tree
Hide file tree
Showing 5 changed files with 537 additions and 0 deletions.
7 changes: 7 additions & 0 deletions docs/source/metrics.rst
Original file line number Diff line number Diff line change
Expand Up @@ -69,6 +69,13 @@ Metrics
.. autoclass:: SurfaceDistanceMetric
:members:

`Surface dice`
--------------
.. autofunction:: compute_surface_dice

.. autoclass:: SurfaceDiceMetric
:members:

`Mean squared error`
--------------------
.. autoclass:: MSEMetric
Expand Down
1 change: 1 addition & 0 deletions monai/metrics/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,5 +17,6 @@
from .metric import Cumulative, CumulativeIterationMetric, IterationMetric, Metric
from .regression import MAEMetric, MSEMetric, PSNRMetric, RMSEMetric
from .rocauc import ROCAUCMetric, compute_roc_auc
from .surface_dice import SurfaceDiceMetric, compute_surface_dice
from .surface_distance import SurfaceDistanceMetric, compute_average_surface_distance
from .utils import do_metric_reduction, get_mask_edges, get_surface_distance, ignore_background
236 changes: 236 additions & 0 deletions monai/metrics/surface_dice.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,236 @@
# Copyright (c) MONAI Consortium
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
# http://www.apache.org/licenses/LICENSE-2.0
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import warnings
from typing import List, Union

import numpy as np
import torch

from monai.metrics.utils import do_metric_reduction, get_mask_edges, get_surface_distance, ignore_background
from monai.utils import MetricReduction, convert_data_type

from .metric import CumulativeIterationMetric


class SurfaceDiceMetric(CumulativeIterationMetric):
"""
Computes the Normalized Surface Distance (NSD) for each batch sample and class of
predicted segmentations `y_pred` and corresponding reference segmentations `y` according to equation :eq:`nsd`.
This implementation supports 2D images. For 3D images, please refer to DeepMind's implementation
https://github.com/deepmind/surface-distance.
The class- and batch sample-wise NSD values can be aggregated with the function `aggregate`.
Args:
class_thresholds: List of class-specific thresholds.
The thresholds relate to the acceptable amount of deviation in the segmentation boundary in pixels.
Each threshold needs to be a finite, non-negative number.
include_background: Whether to skip NSD computation on the first channel of the predicted output.
Defaults to ``False``.
distance_metric: The metric used to compute surface distances.
One of [``"euclidean"``, ``"chessboard"``, ``"taxicab"``].
Defaults to ``"euclidean"``.
reduction: The mode to aggregate metrics.
One of [``"mean"``, ``"sum"``, ``"mean_batch"``, ``"sum_batch"``, ``"mean_channel"``, ``"sum_channel"``,
``"none"``].
Defaults to ``"mean"``.
If ``"none"`` is chosen, no aggregation will be performed.
The aggregation will ignore nan values.
get_not_nans: whether to return the `not_nans` count.
Defaults to ``False``.
`not_nans` is the number of batch samples for which not all class-specific NSD values were nan values.
If set to ``True``, the function `aggregate` will return both the aggregated NSD and the `not_nans` count.
If set to ``False``, `aggregate` will only return the aggregated NSD.
"""

def __init__(
self,
class_thresholds: List[float],
include_background: bool = False,
distance_metric: str = "euclidean",
reduction: Union[MetricReduction, str] = MetricReduction.MEAN,
get_not_nans: bool = False,
) -> None:
super().__init__()
self.class_thresholds = class_thresholds
self.include_background = include_background
self.distance_metric = distance_metric
self.reduction = reduction
self.get_not_nans = get_not_nans

def _compute_tensor(self, y_pred: torch.Tensor, y: torch.Tensor): # type: ignore
r"""
Args:
y_pred: Predicted segmentation, typically segmentation model output.
It must be a one-hot encoded, batch-first tensor [B,C,H,W].
y: Reference segmentation.
It must be a one-hot encoded, batch-first tensor [B,C,H,W].
Returns:
Pytorch Tensor of shape [B,C], containing the NSD values :math:`\operatorname {NSD}_{b,c}` for each batch
index :math:`b` and class :math:`c`.
"""
return compute_surface_dice(
y_pred=y_pred,
y=y,
class_thresholds=self.class_thresholds,
include_background=self.include_background,
distance_metric=self.distance_metric,
)

def aggregate(self):
r"""
Aggregates the output of `_compute_tensor`.
Returns:
If `get_not_nans` is set to ``True``, this function returns the aggregated NSD and the `not_nans` count.
If `get_not_nans` is set to ``False``, this function returns only the aggregated NSD.
"""
data = self.get_buffer()
if not isinstance(data, torch.Tensor):
raise ValueError("the data to aggregate must be PyTorch Tensor.")

# do metric reduction
f, not_nans = do_metric_reduction(data, self.reduction)
return (f, not_nans) if self.get_not_nans else f


def compute_surface_dice(
y_pred: torch.Tensor,
y: torch.Tensor,
class_thresholds: List[float],
include_background: bool = False,
distance_metric: str = "euclidean",
):
r"""
This function computes the (Normalized) Surface Dice (NSD) between the two tensors `y_pred` (referred to as
:math:`\hat{Y}`) and `y` (referred to as :math:`Y`). This metric determines which fraction of a segmentation
boundary is correctly predicted. A boundary element is considered correctly predicted if the closest distance to the
reference boundary is smaller than or equal to the specified threshold related to the acceptable amount of deviation in
pixels. The NSD is bounded between 0 and 1.
This implementation supports multi-class tasks with an individual threshold :math:`\tau_c` for each class :math:`c`.
The class-specific NSD for batch index :math:`b`, :math:`\operatorname {NSD}_{b,c}`, is computed using the function:
.. math::
\operatorname {NSD}_{b,c} \left(Y_{b,c}, \hat{Y}_{b,c}\right) = \frac{\left|\mathcal{D}_{Y_{b,c}}^{'}\right| +
\left| \mathcal{D}_{\hat{Y}_{b,c}}^{'} \right|}{\left|\mathcal{D}_{Y_{b,c}}\right| +
\left|\mathcal{D}_{\hat{Y}_{b,c}}\right|}
:label: nsd
with :math:`\mathcal{D}_{Y_{b,c}}` and :math:`\mathcal{D}_{\hat{Y}_{b,c}}` being two sets of nearest-neighbor
distances. :math:`\mathcal{D}_{Y_{b,c}}` is computed from the predicted segmentation boundary towards the reference segmentation
boundary and vice-versa for :math:`\mathcal{D}_{\hat{Y}_{b,c}}`. :math:`\mathcal{D}_{Y_{b,c}}^{'}` and
:math:`\mathcal{D}_{\hat{Y}_{b,c}}^{'}` refer to the subsets of distances that are smaller or equal to the
acceptable distance :math:`\tau_c`:
.. math::
\mathcal{D}_{Y_{b,c}}^{'} = \{ d \in \mathcal{D}_{Y_{b,c}} \, | \, d \leq \tau_c \}.
In the case of a class neither being present in the predicted segmentation, nor in the reference segmentation, a nan value
will be returned for this class. In the case of a class being present in only one of predicted segmentation or
reference segmentation, the class NSD will be 0.
This implementation is based on https://arxiv.org/abs/2111.05408 and supports 2D images.
Be aware that the computation of boundaries is different from DeepMind's implementation
https://github.com/deepmind/surface-distance. In this implementation, the length of a segmentation boundary is
interpreted as the number of its edge pixels. In DeepMind's implementation, the length of a segmentation boundary
depends on the local neighborhood (cf. https://arxiv.org/abs/1809.04430).
Args:
y_pred: Predicted segmentation, typically segmentation model output.
It must be a one-hot encoded, batch-first tensor [B,C,H,W].
y: Reference segmentation.
It must be a one-hot encoded, batch-first tensor [B,C,H,W].
class_thresholds: List of class-specific thresholds.
The thresholds relate to the acceptable amount of deviation in the segmentation boundary in pixels.
Each threshold needs to be a finite, non-negative number.
include_background: Whether to skip the surface dice computation on the first channel of
the predicted output. Defaults to ``False``.
distance_metric: The metric used to compute surface distances.
One of [``"euclidean"``, ``"chessboard"``, ``"taxicab"``].
Defaults to ``"euclidean"``.
Raises:
ValueError: If `y_pred` and/or `y` are not PyTorch tensors.
ValueError: If `y_pred` and/or `y` do not have four dimensions.
ValueError: If `y_pred` and/or `y` have different shapes.
ValueError: If `y_pred` and/or `y` are not one-hot encoded
ValueError: If the number of channels of `y_pred` and/or `y` is different from the number of class thresholds.
ValueError: If any class threshold is not finite.
ValueError: If any class threshold is negative.
Returns:
Pytorch Tensor of shape [B,C], containing the NSD values :math:`\operatorname {NSD}_{b,c}` for each batch index
:math:`b` and class :math:`c`.
"""

if not include_background:
y_pred, y = ignore_background(y_pred=y_pred, y=y)

if not isinstance(y_pred, torch.Tensor) or not isinstance(y, torch.Tensor):
raise ValueError("y_pred and y must be PyTorch Tensor.")

if y_pred.ndimension() != 4 or y.ndimension() != 4:
raise ValueError("y_pred and y should have four dimensions: [B,C,H,W].")

if y_pred.shape != y.shape:
raise ValueError(
f"y_pred and y should have same shape, but instead, shapes are {y_pred.shape} (y_pred) and {y.shape} (y)."
)

if not torch.all(y_pred.byte() == y_pred) or not torch.all(y.byte() == y):
raise ValueError("y_pred and y should be binarized tensors (e.g. torch.int64).")
if torch.any(y_pred > 1) or torch.any(y > 1):
raise ValueError("y_pred and y should be one-hot encoded.")

y = y.float()
y_pred = y_pred.float()

batch_size, n_class = y_pred.shape[:2]

if n_class != len(class_thresholds):
raise ValueError(
f"number of classes ({n_class}) does not match number of class thresholds ({len(class_thresholds)})."
)

if any(~np.isfinite(class_thresholds)):
raise ValueError("All class thresholds need to be finite.")

if any(np.array(class_thresholds) < 0):
raise ValueError("All class thresholds need to be >= 0.")

nsd = np.empty((batch_size, n_class))

for b, c in np.ndindex(batch_size, n_class):
(edges_pred, edges_gt) = get_mask_edges(y_pred[b, c], y[b, c], crop=False)
if not np.any(edges_gt):
warnings.warn(f"the ground truth of class {c} is all 0, this may result in nan/inf distance.")
if not np.any(edges_pred):
warnings.warn(f"the prediction of class {c} is all 0, this may result in nan/inf distance.")

distances_pred_gt = get_surface_distance(edges_pred, edges_gt, distance_metric=distance_metric)
distances_gt_pred = get_surface_distance(edges_gt, edges_pred, distance_metric=distance_metric)

boundary_complete = len(distances_pred_gt) + len(distances_gt_pred)
boundary_correct = np.sum(distances_pred_gt <= class_thresholds[c]) + np.sum(
distances_gt_pred <= class_thresholds[c]
)

if boundary_complete == 0:
# the class is neither present in the prediction, nor in the reference segmentation
nsd[b, c] = np.nan
else:
nsd[b, c] = boundary_correct / boundary_complete

return convert_data_type(nsd, torch.Tensor)[0]
1 change: 1 addition & 0 deletions tests/min_tests.py
Original file line number Diff line number Diff line change
Expand Up @@ -145,6 +145,7 @@ def run_testsuit():
"test_spacingd",
"test_splitdimd",
"test_surface_distance",
"test_surface_dice",
"test_testtimeaugmentation",
"test_torchvision",
"test_torchvisiond",
Expand Down
Loading

0 comments on commit 6602303

Please sign in to comment.