Merge pull request #7 from hacarus/issue/6/ksvd
Add implementation of K-SVD
Showing 5 changed files with 282 additions and 0 deletions.

@@ -1 +1,3 @@
numpy
scipy
scikit-learn>=0.19.0
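
The added dependencies can be installed in the usual way, e.g. pip install -r requirements.txt (assuming this hunk edits the project's requirements.txt; the filename is not shown in this view).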
@@ -0,0 +1,3 @@
from .ksvd import KSVD

__all__ = ['KSVD']
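
With this re-export in place, the estimator can be imported directly from the package, as the test file below does:

    from spmimage.decomposition import KSVD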
@@ -0,0 +1,215 @@
from logging import getLogger

import numpy as np

from sklearn.base import BaseEstimator
from sklearn.decomposition.dict_learning import SparseCodingMixin, sparse_encode
from sklearn.utils import check_array, check_random_state

logger = getLogger(__name__)


def _ksvd(Y: np.ndarray, n_components: int, k0: int, max_iter: int, tol: float,
          code_init: np.ndarray = None, dict_init: np.ndarray = None, n_jobs: int = 1):
"""_ksvd | ||
Finds a dictionary that can be used to represent data using a sparse code. | ||
Solves the optimization problem: | ||
argmin \sum_{i=1}^M || y_i - w_iH ||_2^2 such that ||w_i||_0 <= k_0 for all 1 <= i <= M | ||
({w_i}_{i=1}^M, H) | ||
**Note** | ||
Y ~= WH = code * dictionary | ||
Parameters: | ||
------------ | ||
Y : array-like, shape (n_samples, n_features) | ||
Training vector, where n_samples in the number of samples | ||
and n_features is the number of features. | ||
n_components : int, | ||
number of dictionary elements to extract | ||
k0 : int, | ||
number of non-zero elements of sparse coding | ||
max_iter : int, | ||
maximum number of iterations to perform | ||
tol : float, | ||
tolerance for numerical error | ||
code_init : array of shape (n_samples, n_components), | ||
Initial value for the sparse code for warm restart scenarios. | ||
dict_init : array of shape (n_components, n_features), | ||
initial values for the dictionary, for warm restart | ||
n_jobs : int, optional | ||
Number of parallel jobs to run. | ||
Returns: | ||
--------- | ||
code : array of shape (n_samples, n_components) | ||
The sparse code factor in the matrix factorization. | ||
dictionary : array of shape (n_components, n_features), | ||
The dictionary factor in the matrix factorization. | ||
errors : array | ||
Vector of errors at each iteration. | ||
n_iter : int | ||
Number of iterations run. Returned only if `return_n_iter` is | ||
set to True. | ||
""" | ||

    # initialize the sparse code
    if code_init is None:
        W = np.zeros((Y.shape[0], n_components))
    else:
        W = code_init

    # initialize the dictionary and rescale it by the l2 norms of its columns
    if dict_init is None:
        H = Y[:n_components, :]
    else:
        H = dict_init
    H = np.dot(H, np.diag(1. / np.sqrt(np.diag(np.dot(H.T, H)))))

    errors = [np.linalg.norm(Y - W.dot(H), 'fro')]
    k = -1
    for k in range(max_iter):
        # sparse coding stage: fit a k0-sparse code against the current dictionary
        W = sparse_encode(Y, H, algorithm='omp', n_nonzero_coefs=k0, n_jobs=n_jobs)

        # dictionary update stage: refine the atoms one at a time
        for j in range(n_components):
            # select the samples whose codes actually use atom j
            x = W[:, j] != 0
            if np.sum(x) == 0:
                continue
            W[x, j] = 0

            # residual of those samples with atom j's contribution removed
            error = Y[x, :] - np.dot(W[x, :], H)

            # best rank-1 approximation of the residual; np.linalg.svd returns
            # V already transposed, so V.T[:, 0] is the first right singular vector
            U, s, V = np.linalg.svd(error)
            W[x, j] = U[:, 0] * s[0]
            H[j, :] = V.T[:, 0]

        errors.append(np.linalg.norm(Y - W.dot(H), 'fro'))
        if np.abs(errors[-1] - errors[-2]) < tol:
            break

    return W, H, errors, k + 1
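
# A minimal sketch of calling _ksvd directly (illustrative only; the public
# entry point is the KSVD estimator below):
#
#     Y = np.random.randn(100, 32)
#     code, dictionary, errors, n_iter = _ksvd(Y, n_components=24, k0=4,
#                                              max_iter=10, tol=1e-8)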


class KSVD(BaseEstimator, SparseCodingMixin):
    r"""K-SVD
    Finds a dictionary that can be used to represent data using a sparse code.

    Solves the optimization problem:

        argmin \sum_{i=1}^M ||y_i - A x_i||_2^2
        (A, {x_i}_{i=1}^M)
        subject to ||x_i||_0 <= k0 for all 1 <= i <= M

    Parameters
    ----------
    n_components : int
        Number of dictionary elements to extract.
    k0 : int
        Maximum number of non-zero coefficients in each sparse code.
    max_iter : int
        Maximum number of iterations to perform.
    tol : float
        Tolerance for numerical error.
    transform_algorithm : {'lasso_lars', 'lasso_cd', 'lars', 'omp', 'threshold'}
        Algorithm used to transform the data:
        lars: uses the least angle regression method (linear_model.lars_path);
        lasso_lars: uses Lars to compute the Lasso solution;
        lasso_cd: uses the coordinate descent method to compute the
        Lasso solution (linear_model.Lasso). lasso_lars will be faster if
        the estimated components are sparse;
        omp: uses orthogonal matching pursuit to estimate the sparse solution;
        threshold: squashes to zero all coefficients less than alpha from
        the projection ``dictionary * X'``.

        .. versionadded:: 0.17
           *lasso_cd* coordinate descent method to improve speed.
    transform_n_nonzero_coefs : int, ``0.1 * n_features`` by default
        Number of nonzero coefficients to target in each column of the
        solution. This is only used by `algorithm='lars'` and `algorithm='omp'`
        and is overridden by `alpha` in the `omp` case.
    transform_alpha : float, 1. by default
        If `algorithm='lasso_lars'` or `algorithm='lasso_cd'`, `alpha` is the
        penalty applied to the L1 norm.
        If `algorithm='threshold'`, `alpha` is the absolute value of the
        threshold below which coefficients will be squashed to zero.
        If `algorithm='omp'`, `alpha` is the tolerance parameter: the value of
        the reconstruction error targeted. In this case, it overrides
        `n_nonzero_coefs`.
    n_jobs : int
        Number of parallel jobs to run.
    split_sign : bool, False by default
        Whether to split the sparse feature vector into the concatenation of
        its negative part and its positive part. This can improve the
        performance of downstream classifiers.
    random_state : int, RandomState instance or None, optional (default=None)
        If int, random_state is the seed used by the random number generator;
        if RandomState instance, random_state is the random number generator;
        if None, the random number generator is the RandomState instance used
        by `np.random`.

    Attributes
    ----------
    components_ : array, [n_components, n_features]
        Dictionary atoms extracted from the data.
    error_ : array
        Vector of errors at each iteration.
    n_iter_ : int
        Number of iterations run.

    References
    ----------
    Elad, Michael, and Michal Aharon.
    "Image denoising via sparse and redundant representations over learned
    dictionaries." IEEE Transactions on Image Processing 15.12 (2006): 3736-3745.
    """

    def __init__(self, n_components=None, k0=None, max_iter=1000, tol=1e-8,
                 transform_algorithm='omp', transform_n_nonzero_coefs=None,
                 transform_alpha=None, n_jobs=1,
                 split_sign=False, random_state=None):
        self._set_sparse_coding_params(n_components, transform_algorithm,
                                       transform_n_nonzero_coefs,
                                       transform_alpha, split_sign, n_jobs)
        self.k0 = k0
        self.max_iter = max_iter
        self.tol = tol
        self.random_state = random_state

    def fit(self, X, y=None):
        """Fit the model from data in X.

        Parameters
        ----------
        X : array-like, shape (n_samples, n_features)
            Training vector, where n_samples is the number of samples
            and n_features is the number of features.
        y : Ignored

        Returns
        -------
        self : object
            Returns the object itself.
        """
        # turn the seed into a np.random.RandomState instance
        random_state = check_random_state(self.random_state)

        # validate the input (array, list, sparse matrix or similar) and convert it
        # to an at least 2D numpy array; object dtype is coerced to float,
        # raising on failure
        X = check_array(X)
        n_samples, n_features = X.shape
        if self.n_components is None:
            n_components = X.shape[1]
        else:
            n_components = self.n_components

        # cap k0 at the number of features; use all features if unset
        if self.k0 is None:
            k0 = n_features
        elif self.k0 > n_features:
            k0 = n_features
        else:
            k0 = self.k0

        # initialize code
        code_init = random_state.rand(n_samples, n_components)
        # initialize dictionary
        dict_init = random_state.rand(n_components, n_features)

        code, self.components_, self.error_, self.n_iter_ = _ksvd(
            X, n_components, k0,
            max_iter=self.max_iter, tol=self.tol,
            code_init=code_init, dict_init=dict_init,
            n_jobs=self.n_jobs)

        return self
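
A minimal usage sketch of the new estimator (illustrative only; all names are taken from this diff):

    import numpy as np
    from spmimage.decomposition import KSVD

    X = np.random.randn(128, 32)              # toy data: 128 samples, 32 features
    model = KSVD(n_components=24, k0=4, max_iter=50)
    model.fit(X)                              # learn the dictionary (components_)
    code = model.transform(X)                 # sparse codes via OMP (transform_algorithm='omp')
    X_hat = np.dot(code, model.components_)   # reconstruction, X ~= code * dictionary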
@@ -0,0 +1,48 @@
from unittest import TestCase
from typing import Tuple

from spmimage.decomposition import KSVD

import numpy as np


class TestKSVD(TestCase):

    @staticmethod
    def generate_input(n_samples: int, n_features: int, n_components: int, k0: int) \
            -> Tuple[np.ndarray, np.ndarray]:
        # random dictionary base, rescaled by the l2 norms of its columns
        A0 = np.random.randn(n_components, n_features)
        A0 = np.dot(A0, np.diag(1. / np.sqrt(np.diag(np.dot(A0.T, A0)))))

        X = np.zeros((n_samples, n_features))
        for i in range(n_samples):
            # each sample combines k0 randomly selected atoms of the dictionary
            X[i, :] = np.dot(np.random.randn(k0), A0[np.random.permutation(range(n_components))[:k0], :])
        return A0, X

    def test_ksvd(self):
        np.random.seed(0)
        k0 = 4
        n_samples = 512
        n_features = 32
        n_components = 24
        max_iter = 500

        A0, X = self.generate_input(n_samples, n_features, n_components, k0)
        model = KSVD(n_components=n_components, k0=k0, max_iter=max_iter)
        model.fit(X)

        # check the learning error
        self.assertTrue(model.error_[-1] < 10)
        self.assertTrue(model.n_iter_ <= max_iter)

        # check the estimated dictionary
        norm = np.linalg.norm(model.components_ - A0, ord='fro')
        self.assertTrue(norm < 15)

        # check the reconstructed data
        code = model.transform(X)
        reconstructed = np.dot(code, model.components_)
        reconstruct_error = np.linalg.norm(reconstructed - X, ord='fro')
        self.assertTrue(reconstruct_error < 15)
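
Assuming the repository's usual test layout, the new test case can be run with, e.g., python -m unittest discover.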