seckcoder
diff --git a/‎sklearn/cluster/spectral.py
Lines changed: 26 additions & 9 deletions b/‎sklearn/cluster/spectral.py
Lines changed: 26 additions & 9 deletions
diff --git a/‎sklearn/cluster/tests/test_spectral.py
Lines changed: 16 additions & 15 deletions b/‎sklearn/cluster/tests/test_spectral.py
Lines changed: 16 additions & 15 deletions
@@ -41,7 +41,7 @@ def spectral_embedding(adjacency, n_components=8, mode=None,
     n_components: integer, optional
         The dimension of the projection subspace.
 
-    mode: {None, 'arpack' or 'amg'}
+    mode: {None, 'arpack', 'lobpcg', or 'amg'}
         The eigenvalue decomposition strategy to use. AMG requires pyamg
         to be installed. It can be faster on very large, sparse problems,
         but may also lead to instabilities
@@ -78,6 +78,9 @@ def spectral_embedding(adjacency, n_components=8, mode=None,
     # XXX: Should we check that the matrices given is symmetric
     if mode is None:
         mode = 'arpack'
+    elif not mode in ('arpack', 'lobpcg', 'amg'):
+        raise ValueError("Unknown value for mode: '%s'."
+                         "Should be 'amg' or 'arpack'" % mode)
     laplacian, dd = graph_laplacian(adjacency,
                                     normed=True, return_diag=True)
     if (mode == 'arpack'
@@ -118,25 +121,39 @@ def spectral_embedding(adjacency, n_components=8, mode=No
10000
ne,
         # near 1.0 and leads to much faster convergence: potentially an
         # orders-of-magnitude speedup over simply using keyword which='LA'
         # in standard mode.
-        lambdas, diffusion_map = eigsh(-laplacian, k=n_components,
-                                       sigma=1.0, which='LM')
-        embedding = diffusion_map.T[::-1] * dd
-    elif mode == 'amg':
+        try:
+            lambdas, diffusion_map = eigsh(-laplacian, k=n_components,
+                                        sigma=1.0, which='LM')
+            embedding = diffusion_map.T[::-1] * dd
+        except RuntimeError:
+            # When submatrices are exactly singular, an LU decomposition
+            # in arpack fails. We fallback to lobpcg
+            mode = "lobpcg"
+
+    if mode == 'amg':
         # Use AMG to get a preconditioner and speed up the eigenvalue
         # problem.
         laplacian = laplacian.astype(np.float)  # lobpcg needs native floats
         ml = smoothed_aggregation_solver(laplacian.tocsr())
+        M = ml.aspreconditioner()
         X = random_state.rand(laplacian.shape[0], n_components)
         X[:, 0] = 1. / dd.ravel()
-        M = ml.aspreconditioner()
         lambdas, diffusion_map = lobpcg(laplacian, X, M=M, tol=1.e-12,
                                         largest=False)
         embedding = diffusion_map.T * dd
         if embedding.shape[0] == 1:
             raise ValueError
-    else:
-        raise ValueError("Unknown value for mode: '%s'."
-                         "Should be 'amg' or 'arpack'" % mode)
+    elif mode == "lobpcg":
+        # We increase the number of eigenvectors requested, as lobpcg
+        # doesn't behave well in low dimension
+        X = random_state.rand(laplacian.shape[0], n_components + 4)
+        X[:, 0] = 1. / dd.ravel()
+        lambdas, diffusion_map = lobpcg(laplacian, X, tol=1e-15,
+                                        largest=False, maxiter=2000,
+                                        verbosityLevel=20)
+        embedding = diffusion_map.T[:n_components] * dd
+        if embedding.shape[0] == 1:
+            raise ValueError
     return embedding
 
 
 
@@ -25,21 +25,22 @@ def test_spectral_clustering():
                   [0, 0, 0, 1, 2, 4, 1],
                  ])
 
-    for mat in (S, sparse.csr_matrix(S)):
-        model = SpectralClustering(random_state=0, n_clusters=2,
-                affinity='precomputed').fit(mat)
-        labels = model.labels_
-        if labels[0] == 0:
-            labels = 1 - labels
-
-        assert_equal(labels, [1, 1, 1, 0, 0, 0, 0])
-
-        model_copy = loads(dumps(model))
-        assert_equal(model_copy.n_clusters, model.n_clusters)
-        assert_equal(model_copy.mode, model.mode)
-        assert_equal(model_copy.random_state.get_state(),
-                     model.random_state.get_state())
-        assert_equal(model_copy.labels_, model.labels_)
+    for mode in ('arpack', 'lobpcg'):
+        for mat in (S, sparse.csr_matrix(S)):
+            model = SpectralClustering(random_state=0, n_clusters=2,
+                    affinity='precomputed', mode=mode).fit(mat)
+            labels = model.labels_
+            if labels[0] == 0:
+                labels = 1 - labels
+
+            assert_equal(labels, [1, 1, 1, 0, 0, 0, 0])
+
+            model_copy = loads(dumps(model))
+            assert_equal(model_copy.n_clusters, model.n_clusters)
+            assert_equal(model_copy.mode, model.mode)
+            assert_equal(model_copy.random_state.get_state(),
+                        model.random_state.get_state())
+            assert_equal(model_copy.labels_, model.labels_)
 
 
 def test_spectral_amg_mode():