Skip to content

Commit

Permalink
Merge pull request scikit-image#719 from ahojnnes/slic
Browse files Browse the repository at this point in the history
This PR:
 - speeds up SLIC while reducing memory usage,
 - closes scikit-image#717,
 - adds support for a voxel spacing argument for anisotropic images,
 - removes default gaussian blurring,
 - removes "magic" guessing whether input was multichannel.
  • Loading branch information
jni committed Sep 27, 2013
2 parents d194118 + 8fb6fd0 commit 610b22b
Show file tree
Hide file tree
Showing 5 changed files with 262 additions and 152 deletions.
18 changes: 9 additions & 9 deletions TODO.txt
Original file line number Diff line number Diff line change
@@ -1,15 +1,15 @@
Version 0.10
------------
* Remove deprecated functions:
- ``skimage.filter.rank.*``
* Remove deprecated parameter ``epsilon`` of ``skimage.viewer.LineProfile``
* Remove backwards-compatibility of ``skimage.measure.regionprops``
* Remove deprecated functions in `skimage.filter.rank.*`
* Remove deprecated parameter `epsilon` of `skimage.viewer.LineProfile`
* Remove backwards-compatibility of `skimage.measure.regionprops`
* Remove {`ratio`, `sigma`} deprecation warnings of `skimage.segmentation.slic`

Version 0.9
-----------
* Remove deprecated functions
- ``skimage.filter.denoise_tv_chambolle``
- ``skimage.morphology.is_local_maximum``
- ``skimage.transform.hough``
- ``skimage.transform.probabilistic_hough``
- ``skimage.transform.hough_peaks``
- `skimage.filter.denoise_tv_chambolle`
- `skimage.morphology.is_local_maximum`
- `skimage.transform.hough`
- `skimage.transform.probabilistic_hough`
- `skimage.transform.hough_peaks`
4 changes: 3 additions & 1 deletion doc/source/api_changes.txt
Original file line number Diff line number Diff line change
@@ -1,6 +1,8 @@
Version 0.9
-----------
- No longer wrap ``imread`` output in an ``Image`` class.
- No longer wrap ``imread`` output in an ``Image`` class
- Change default value of `sigma` parameter in ``skimage.segmentation.slic``
to 0

Version 0.4
-----------
Expand Down
178 changes: 116 additions & 62 deletions skimage/segmentation/_slic.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -2,93 +2,147 @@
#cython: boundscheck=False
#cython: nonecheck=False
#cython: wraparound=False
from libc.float cimport DBL_MAX

import numpy as np
from scipy import ndimage
cimport numpy as cnp

from skimage.util import img_as_float, regular_grid
from skimage.color import rgb2lab, gray2rgb
from skimage.util import regular_grid


def _slic_cython(double[:, :, :, ::1] image_zyx,
Py_ssize_t[:, :, ::1] nearest_mean,
double[:, :, ::1] distance,
double[:, ::1] means,
Py_ssize_t max_iter, Py_ssize_t n_segments):
double[:, ::1] segments,
Py_ssize_t max_iter,
double[::1] spacing):
"""Helper function for SLIC segmentation.
Parameters
----------
image_zyx : 4D array of double, shape (Z, Y, X, 6)
The image with embedded coordinates, that is, `image_zyx[i, j, k]` is
`array([i, j, k, r, g, b])` or `array([i, j, k, L, a, b])`, depending
on the colorspace.
nearest_mean : 3D array of int, shape (Z, Y, X)
The (initially empty) label field.
distance : 3D array of double, shape (Z, Y, X)
The (initially infinity) array of distances to the nearest centroid.
means : 2D array of double, shape (n_segments, 6)
The centroids obtained by SLIC.
image_zyx : 4D array of double, shape (Z, Y, X, C)
The input image.
segments : 2D array of double, shape (N, 3 + C)
The initial centroids obtained by SLIC as [Z, Y, X, C...].
max_iter : int
The maximum number of k-means iterations.
n_segments : int
The approximate/desired number of segments.
spacing : 1D array of double, shape (3,)
The voxel spacing along each image dimension. This parameter
controls the weights of the distances along z, y, and x during
k-means clustering.
Returns
-------
nearest_mean : 3D array of int, shape (Z, Y, X)
nearest_segments : 3D array of int, shape (Z, Y, X)
The label field/superpixels found by SLIC.
Notes
-----
The image is considered to be in (z, y, x) order, which can be
surprising. More commonly, the order (x, y, z) is used. However,
in 3D image analysis, 'z' is usually the "special" dimension, with,
for example, a different effective resolution than the other two
axes. Therefore, x and y are often processed together, or viewed as
a cut-plane through the volume. So, if the order was (x, y, z) and
we wanted to look at the 5th cut plane, we would write::
my_z_plane = img3d[:, :, 5]
but, assuming a C-contiguous array, this would grab a discontiguous
slice of memory, which is bad for performance. In contrast, if we
see the image as (z, y, x) ordered, we would do::
my_z_plane = img3d[5]
and get back a contiguous block of memory. This is better both for
performance and for readability.
"""

# initialize on grid:
# initialize on grid
cdef Py_ssize_t depth, height, width
depth, height, width = (image_zyx.shape[0], image_zyx.shape[1],
image_zyx.shape[2])
depth = image_zyx.shape[0]
height = image_zyx.shape[1]
width = image_zyx.shape[2]

cdef Py_ssize_t n_segments = segments.shape[0]
# number of features [X, Y, Z, ...]
cdef Py_ssize_t n_features = segments.shape[1]

# approximate grid size for desired n_segments
cdef Py_ssize_t step_z, step_y, step_x
slices = regular_grid((depth, height, width), n_segments)
step_z, step_y, step_x = [int(s.step) for s in slices]

n_means = means.shape[0]
cdef Py_ssize_t i, k, x, y, z, x_min, x_max, y_min, y_max, z_min, z_max, \
changes
cdef double dist_mean
cdef double tmp
cdef Py_ssize_t[:, :, ::1] nearest_segments \
= np.empty((depth, height, width), dtype=np.intp)
cdef double[:, :, ::1] distance \
= np.empty((depth, height, width), dtype=np.double)
cdef Py_ssize_t[::1] n_segment_elems = np.zeros(n_segments, dtype=np.intp)

cdef Py_ssize_t i, c, k, x, y, z, x_min, x_max, y_min, y_max, z_min, z_max
cdef char change
cdef double dist_center, cx, cy, cz, dy, dz

cdef double sz, sy, sx
sz = spacing[0]
sy = spacing[1]
sx = spacing[2]

for i in range(max_iter):
changes = 0
distance[:, :, :] = np.inf
# assign pixels to means
for k in range(n_means):
# compute windows:
z_min = int(max(means[k, 0] - 2 * step_z, 0))
z_max = int(min(means[k, 0] + 2 * step_z, depth))
y_min = int(max(means[k, 1] - 2 * step_y, 0))
y_max = int(min(means[k, 1] + 2 * step_y, height))
x_min = int(max(means[k, 2] - 2 * step_x, 0))
x_max = int(min(means[k, 2] + 2 * step_x, width))
change = 0
distance[:, :, :] = DBL_MAX

# assign pixels to segments
for k in range(n_segments):

# segment coordinate centers
cz = segments[k, 0]
cy = segments[k, 1]
cx = segments[k, 2]

# compute windows
z_min = <Py_ssize_t>max(cz - 2 * step_z, 0)
z_max = <Py_ssize_t>min(cz + 2 * step_z + 1, depth)
y_min = <Py_ssize_t>max(cy - 2 * step_y, 0)
y_max = <Py_ssize_t>min(cy + 2 * step_y + 1, height)
x_min = <Py_ssize_t>max(cx - 2 * step_x, 0)
x_max = <Py_ssize_t>min(cx + 2 * step_x + 1, width)

for z in range(z_min, z_max):
dz = (sz * (cz - z)) ** 2
for y in range(y_min, y_max):
dy = (sy * (cy - y)) ** 2
for x in range(x_min, x_max):
dist_mean = 0
for c in range(6):
# you would think the compiler can optimize the
# squaring itself. mine can't (with O2)
tmp = image_zyx[z, y, x, c] - means[k, c]
dist_mean += tmp * tmp
if distance[z, y, x] > dist_mean:
nearest_mean[z, y, x] = k
distance[z, y, x] = dist_mean
changes = 1
if changes == 0:
dist_center = dz + dy + (sx * (cx - x)) ** 2
for c in range(3, n_features):
dist_center += (image_zyx[z, y, x, c - 3]
- segments[k, c]) ** 2
if distance[z, y, x] > dist_center:
nearest_segments[z, y, x] = k
distance[z, y, x] = dist_center
change = 1

# stop if no pixel changed its segment
if change == 0:
break
# recompute means:
nearest_mean_ravel = np.asarray(nearest_mean).ravel()
means_list = []
for j in range(6):
image_zyx_ravel = (
np.ascontiguousarray(image_zyx[:, :, :, j]).ravel())
means_list.append(np.bincount(nearest_mean_ravel,
image_zyx_ravel))
in_mean = np.bincount(nearest_mean_ravel)
in_mean[in_mean == 0] = 1
means = (np.vstack(means_list) / in_mean).T.copy("C")
return np.ascontiguousarray(nearest_mean)

# recompute segment centers

# sum features for all segments
n_segment_elems[:] = 0
segments[:, :] = 0
for z in range(depth):
for y in range(height):
for x in range(width):
k = nearest_segments[z, y, x]
n_segment_elems[k] += 1
segments[k, 0] += z
segments[k, 1] += y
segments[k, 2] += x
for c in range(3, n_features):
segments[k, c] += image_zyx[z, y, x, c - 3]

# divide by number of elements per segment to obtain mean
for k in range(n_segments):
for c in range(n_features):
segments[k, c] /= n_segment_elems[k]

return np.asarray(nearest_segments)
Loading

0 comments on commit 610b22b

Please sign in to comment.