Formatting fixes for randomized svd/pca solver · scikit-learn/scikit-learn@201ff7d · GitHub

Commit 201ff7d

Formatting fixes for randomized svd/pca solver
1 parent b64c3ef commit 201ff7d

File tree: 3 files changed (+53, -64 lines)

3 files changed

+53
-64
lines changed

sklearn/decomposition/pca.py

Lines changed: 5 additions & 8 deletions
@@ -527,14 +527,11 @@ def _fit_truncated(self, X, n_components, svd_solver):
 
         elif svd_solver == 'randomized':
             # sign flipping is done inside
-            U, S, V = randomized_svd(
-                X,
-                n_components=n_components,
-                n_iter=self.iterated_power,
-                flip_sign=True,
-                subtract_mean=True,
-                random_state=random_state,
-            )
+            U, S, V = randomized_svd(X, n_components=n_components,
+                                     n_iter=self.iterated_power,
+                                     flip_sign=True,
+                                     random_state=random_state,
+                                     subtract_mean=True)
 
         self.n_samples_, self.n_features_ = n_samples, n_features
         self.components_ = V
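The reformatted call still forwards `subtract_mean=True`, which is what lets the randomized solver work on scipy sparse input without densifying it. A minimal usage sketch, assuming a scikit-learn build that contains this branch's changes (sparse input for the randomized solver is not supported in released versions):

import numpy as np
import scipy.sparse as sp
from sklearn.decomposition import PCA

rng = np.random.RandomState(0)
# Sparse 0/1 data, similar to the updated test below
X_sp = sp.csr_matrix(rng.binomial(1, 0.1, (100, 80)).astype(float))

# The randomized solver centers implicitly via subtract_mean, so the sparse
# matrix is never converted into a dense, centered array.
pca = PCA(n_components=3, svd_solver='randomized', random_state=0).fit(X_sp)
print(pca.singular_values_)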

sklearn/decomposition/tests/test_pca.py

Lines changed: 9 additions & 18 deletions
@@ -283,7 +283,7 @@ def test_singular_values():
     assert_array_almost_equal(apca.singular_values_,
                               np.sqrt(np.sum(X_apca**2.0, axis=0)), 12)
     assert_array_almost_equal(rpca.singular_values_,
-                              np.sqrt(np.sum(X_rpca**2.0, axis=0)), 2)
+                              np.sqrt(np.sum(X_rpca**2.0, axis=0)), 12)
 
     # Set the singular values and see what we get back
     rng = np.random.RandomState(0)
@@ -688,38 +688,30 @@ def test_pca_sparse_input_randomized_solver():
     n_samples = 100
     n_features = 80
 
-    # The randomized method produces larger errors whenever the means of the
-    # matrix are way off the origin
-    X = rng.normal(1000, 20, (n_samples, n_features))
-
+    X = rng.binomial(1, 0.1, (n_samples, n_features))
     X_sp = sp.sparse.csr_matrix(X)
-    assert sp.sparse.issparse(X_sp)
 
     # Compute the complete decomposition on the dense matrix
-    pca = PCA(n_components=3, svd_solver='full', random_state=rng).fit(X)
+    pca = PCA(n_components=3, svd_solver='randomized',
+              random_state=rng, iterated_power=30).fit(X)
     # And compute a randomized decomposition on the sparse matrix. Increase the
     # number of power iterations to account for the non-zero means
-    pca_sp = PCA(
-        n_components=3,
-        svd_solver='randomized',
-        random_state=rng,
-        iterated_power=20,
-    ).fit(X_sp)
+    pca_sp = PCA(n_components=3, svd_solver='randomized',
+                 random_state=rng, iterated_power=30).fit(X_sp)
 
     # Ensure the singular values are close to the exact singular values
-    assert_array_almost_equal(pca_sp.singular_values_, pca.singular_values_, 5)
+    np.testing.assert_allclose(pca_sp.singular_values_, pca.singular_values_)
 
     # Ensure that the basis is close to the true basis
     X_pca = pca.transform(X)
     X_sppca = pca_sp.transform(X)
-    assert_array_almost_equal(X_sppca, X_pca, 2)
+    np.testing.assert_allclose(X_sppca, X_pca, 1e-3)
 
 
 @pytest.mark.parametrize('svd_solver', ['full', 'arpack'])
 def test_pca_sparse_input_bad_solvers(svd_solver):
     X = np.random.RandomState(0).rand(5, 4)
     X = sp.sparse.csr_matrix(X)
-    assert sp.sparse.issparse(X)
 
     pca = PCA(n_components=3, svd_solver=svd_solver)
 
@@ -729,12 +721,11 @@ def test_pca_sparse_input_bad_solvers(svd_solver):
 def test_pca_auto_solver_selects_randomized_solver_for_sparse_matrices():
     X = np.random.RandomState(0).rand(5, 4)
     X = sp.sparse.csr_matrix(X)
-    assert sp.sparse.issparse(X)
 
     pca = PCA(n_components=3, svd_solver='auto')
     pca.fit(X)
 
-    assert_equal(pca._fit_svd_solver, 'randomized')
+    assert pca._fit_svd_solver == 'randomized'
 
 
 def test_pca_bad_solver():
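The assertions above switch from `assert_array_almost_equal`, whose third argument is a number of decimal places (roughly an absolute tolerance of `1.5 * 10**-decimal`), to `np.testing.assert_allclose`, whose third positional argument is a relative tolerance `rtol`. A small standalone illustration of the difference (not part of the commit):

import numpy as np

a = np.array([1000.0])
b = np.array([1000.4])

# decimal=2 means |a - b| < 1.5e-2, an absolute criterion: this pair fails it.
# np.testing.assert_array_almost_equal(a, b, 2)  # would raise AssertionError

# rtol=1e-3 means |a - b| <= 1e-3 * |b|, a relative criterion: this pair passes.
np.testing.assert_allclose(a, b, 1e-3)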

sklearn/utils/extmath.py

Lines changed: 39 additions & 38 deletions
@@ -147,8 +147,8 @@ def safe_sparse_dot(a, b, dense_output=False):
 
 def randomized_range_finder(A, size, n_iter,
                             power_iteration_normalizer='auto',
-                            subtract_mean=False,
-                            random_state=None):
+                            random_state=None,
+                            subtract_mean=False):
     """Computes an orthonormal matrix whose range approximates the range of A.
 
     Parameters
@@ -172,20 +172,20 @@ def randomized_range_finder(A, size, n_iter,
 
         .. versionadded:: 0.18
 
-    subtract_mean : bool
-        Whether the mean of `A` should be subtracted after each multiplication
-        by the `A` matrix. This is equivalent to multiplying matrices by a
-        centered `A` without ever having to explicitly center. This is
-        especially useful for performing PCA on large sparse matrices, so they
-        do not need to be centered.
-
     random_state : int, RandomState instance or None, optional (default=None)
         The seed of the pseudo random number generator to use when shuffling
         the data. If int, random_state is the seed used by the random number
         generator; If RandomState instance, random_state is the random number
         generator; If None, the random number generator is the RandomState
         instance used by `np.random`.
 
+    subtract_mean : bool
+        Whether the mean of `A` should be subtracted after each multiplication
+        by the `A` matrix. This is equivalent to multiplying matrices by a
+        centered `A` without ever having to explicitly center. This is
+        especially useful for performing PCA on large sparse matrices, so they
+        do not need to be centered.
+
     Returns
     -------
     Q : 2D array
@@ -219,39 +219,45 @@ def randomized_range_finder(A, size, n_iter,
     else:
         power_iteration_normalizer = 'LU'
 
+    # Prepare functions that will multiply `Q` with `A`
     if subtract_mean:
         c = A.mean(axis=0).reshape((1, -1))
-        applyA = lambda X: safe_sparse_dot(A, X) - safe_sparse_dot(c, X)
-        applyAT = lambda X: safe_sparse_dot(A.T, X) - \
-            safe_sparse_dot(c.T, Q.sum(axis=0).reshape((1, -1)))
+
+        def _apply_A(X):
+            return safe_sparse_dot(A, X) - safe_sparse_dot(c, X)
+
+        def _apply_AT(X):
+            return safe_sparse_dot(A.T, X) - \
+                safe_sparse_dot(c.T, Q.sum(axis=0).reshape((1, -1)))
     else:
-        applyA = lambda X: safe_sparse_dot(A, X)
-        applyAT = lambda X: safe_sparse_dot(A.T, X)
+        def _apply_A(X):
+            return safe_sparse_dot(A, X)
 
-    Q = applyA(Q)
+        def _apply_AT(X):
+            return safe_sparse_dot(A.T, X)
 
     # Perform power iterations with Q to further 'imprint' the top
     # singular vectors of A in Q
     for i in range(n_iter):
         if power_iteration_normalizer == 'none':
-            Q = applyAT(Q)
-            Q = applyA(Q)
+            Q = _apply_A(Q)
+            Q = _apply_AT(Q)
         elif power_iteration_normalizer == 'LU':
-            Q, _ = linalg.lu(applyAT(Q), permute_l=True)
-            Q, _ = linalg.lu(applyA(Q), permute_l=True)
+            Q, _ = linalg.lu(_apply_A(Q), permute_l=True)
+            Q, _ = linalg.lu(_apply_AT(Q), permute_l=True)
         elif power_iteration_normalizer == 'QR':
-            Q, _ = linalg.qr(applyAT(Q), mode='economic')
-            Q, _ = linalg.qr(applyA(Q), mode='economic')
+            Q, _ = linalg.qr(_apply_A(Q), mode='economic')
+            Q, _ = linalg.qr(_apply_AT(Q), mode='economic')
 
     # Sample the range of A by linear projection of Q
     # Extract an orthonormal basis
-    Q, _ = linalg.qr(Q, mode='economic')
+    Q, _ = linalg.qr(_apply_A(Q), mode='economic')
     return Q
 
 
 def randomized_svd(M, n_components, n_oversamples=10, n_iter='auto',
                    power_iteration_normalizer='auto', transpose='auto',
-                   flip_sign=True, subtract_mean=False, random_state=0):
+                   flip_sign=True, random_state=0, subtract_mean=False):
     """Computes a truncated randomized SVD
 
     Parameters
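The `subtract_mean` branch above relies on a simple identity: if `c` is the row vector of column means of `A` and `ones` a column of ones, then `(A - ones @ c) @ X == A @ X - ones @ (c @ X)`, so products with the centered matrix never require forming it. A standalone NumPy check of that identity (illustrative only; the names below are not part of the commit):

import numpy as np

rng = np.random.RandomState(0)
A = rng.rand(50, 20)
X = rng.rand(20, 5)

c = A.mean(axis=0).reshape(1, -1)   # column means, shape (1, 20)
ones = np.ones((A.shape[0], 1))     # column of ones, shape (50, 1)

explicit = (A - ones @ c) @ X       # multiply by the explicitly centered A
implicit = A @ X - ones @ (c @ X)   # same product without forming A - ones @ c

np.testing.assert_allclose(explicit, implicit)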
@@ -302,20 +308,20 @@ def randomized_svd(M, n_components, n_oversamples=10, n_iter='auto',
         set to `True`, the sign ambiguity is resolved by making the largest
         loadings for each component in the left singular vectors positive.
 
-    subtract_mean : bool
-        Whether the mean of `A` should be subtracted after each multiplication
-        by the `A` matrix. This is equivalent to multiplying matrices by a
-        centered `A` without ever having to explicitly center. This is
-        especially useful for performing PCA on large sparse matrices, so they
-        do not need to be centered.
-
     random_state : int, RandomState instance or None, optional (default=None)
         The seed of the pseudo random number generator to use when shuffling
         the data. If int, random_state is the seed used by the random number
         generator; If RandomState instance, random_state is the random number
        generator; If None, the random number generator is the RandomState
        instance used by `np.random`.
 
+    subtract_mean : bool
+        Whether the mean of `A` should be subtracted after each multiplication
+        by the `A` matrix. This is equivalent to multiplying matrices by a
+        centered `A` without ever having to explicitly center. This is
+        especially useful for performing PCA on large sparse matrices, so they
+        do not need to be centered.
+
     Notes
     -----
     This algorithm finds a (usually very good) approximate truncated
@@ -359,14 +365,9 @@ def randomized_svd(M, n_components, n_oversamples=10, n_iter='auto',
         # this implementation is a bit faster with smaller shape[1]
         M = M.T
 
-    Q = randomized_range_finder(
-        M,
-        size=n_random,
-        n_iter=n_iter,
-        power_iteration_normalizer=power_iteration_normalizer,
-        subtract_mean=subtract_mean,
-        random_state=random_state,
-    )
+    Q = randomized_range_finder(M, n_random, n_iter,
+                                power_iteration_normalizer, random_state,
+                                subtract_mean)
 
     # project M to the (k + p) dimensional space using the basis vectors
     B = safe_sparse_dot(Q.T, M)
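Taken together, these changes let `randomized_svd` behave as if `M` had been centered, without the caller ever forming the dense centered matrix. A minimal sketch of calling it that way, assuming a build that contains this commit (the `subtract_mean` keyword is not part of the released scikit-learn API):

import numpy as np
import scipy.sparse as sp
from sklearn.utils.extmath import randomized_svd

rng = np.random.RandomState(0)
M = sp.csr_matrix(rng.binomial(1, 0.1, (100, 80)).astype(float))

# subtract_mean=True makes the range finder use the implicitly centered M,
# which is what PCA needs; M itself stays sparse throughout.
U, S, V = randomized_svd(M, n_components=3, n_iter=10, flip_sign=True,
                         random_state=0, subtract_mean=True)
print(S)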

0 commit comments
