10000 Address NicolasHug's comments on docstrings and atol in tests · scikit-learn/scikit-learn@473b940 · GitHub
[go: up one dir, main page]

Skip to content

Commit 473b940

Browse files
Address NicolasHug's comments on docstrings and atol in tests
1 parent d18a339 commit 473b940

File tree

6 files changed

+25
-24
lines changed

6 files changed

+25
-24
lines changed

sklearn/decomposition/pca.py

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -159,24 +159,24 @@ class PCA(_BasePCA):
159159
160160
svd_solver : string {'auto', 'full', 'arpack', 'randomized'}
161161
auto :
162-
the solver is selected by a default policy based on `X.shape` and
162+
The solver is selected by a default policy based on `X.shape` and
163163
`n_components`: if the input data is larger than 500x500 and the
164164
number of components to extract is lower than 80% of the smallest
165165
dimension of the data, then the more efficient 'randomized'
166166
method is enabled. Otherwise the exact full SVD is computed and
167167
optionally truncated afterwards.
168168
169-
in case sparse data is used, 'randomized' is used as this is the
169+
In case sparse data is used, 'randomized' is used as this is the
170170
only method that supports sparse data.
171171
full :
172-
run exact full SVD calling the standard LAPACK solver via
172+
Run exact full SVD calling the standard LAPACK solver via
173173
`scipy.linalg.svd` and select the components by postprocessing
174174
arpack :
175-
run SVD truncated to n_components calling ARPACK solver via
175+
Run SVD truncated to n_components calling ARPACK solver via
176176
`scipy.sparse.linalg.svds`. It requires strictly
177177
0 < n_components < min(X.shape)
178178
randomized :
179-
run randomized SVD by the method of Halko et al. This is the only
179+
Run randomized SVD by the method of Halko et al. This is the only
180180
method that supports sparse data.
181181
182182
.. versionadded:: 0.18.0
@@ -403,7 +403,7 @@ def _fit(self, X):
403403
# Ensure we don't try call arpack or full on a sparse matrix
404404
if issparse(X) and self._fit_svd_solver != 'randomized':
405405
raise ValueError(
406-
'only the randomized solver supports sparse matrices'
406+
'Only the randomized solver supports sparse matrices'
407407
)
408408

409409
# Call different fits for either full or truncated SVD

sklearn/decomposition/tests/test_pca.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -264,9 +264,9 @@ def test_singular_values():
264264
# Increase the number of power iterations to get greater accuracy in tests
265265
rpca = PCA(n_components=2, svd_solver='randomized', iterated_power=40,
266266
random_state=rng).fit(X)
267-
assert_allclose(pca.singular_values_, apca.singular_values_, 12)
268-
assert_allclose(pca.singular_values_, rpca.singular_values_, 12)
269-
assert_allclose(apca.singular_values_, rpca.singular_values_, 12)
267+
assert_allclose(pca.singular_values_, apca.singular_values_, atol=12)
268+
assert_allclose(pca.singular_values_, rpca.singular_values_, atol=12)
269+
assert_allclose(apca.singular_values_, rpca.singular_values_, atol=12)
270270

271271
# Compare to the Frobenius norm
272272
X_pca = pca.transform(X)
@@ -717,7 +717,7 @@ def test_pca_sparse_input_bad_solvers(svd_solver):
717717

718718
pca = PCA(n_components=3, svd_solver=svd_solver)
719719

720-
with pytest.raises(ValueError, match='only the randomized solver supports '
720+
with pytest.raises(ValueError, match='Only the randomized solver supports '
721721
'sparse matrices'):
722722
pca.fit(X)
723723

sklearn/utils/extmath.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -386,14 +386,14 @@ def randomized_pca(A, n_components, n_oversamples=10, n_iter="auto",
386386
n_components : int
387387
Number of singular values and vectors to extract.
388388
389-
n_oversamples : int (default is 10)
389+
n_oversamples : int (default=10)
390390
Additional number of random vectors to sample the range of M so as
391391
to ensure proper conditioning. The total number of random vectors
392392
used to find the range of M is n_components + n_oversamples. Smaller
393393
number can improve speed but can negatively impact the quality of
394394
approximation of singular vectors and singular values.
395395
396-
n_iter : int or 'auto' (default is 'auto')
396+
n_iter : int or 'auto' (default='auto')
397397
Number of power iterations. It can be used to deal with very noisy
398398
problems. When 'auto', it is set to 4, unless `n_components` is small
399399
(< .1 * min(X.shape)) `n_iter` in which case is set to 7.
@@ -407,7 +407,7 @@ def randomized_pca(A, n_components, n_oversamples=10, n_iter="auto",
407407
but can lose slightly in accuracy). The 'auto' mode applies no
408408
normalization if `n_iter` <= 2 and switches to LU otherwise.
409409
410-
flip_sign : boolean, (True by default)
410+
flip_sign : boolean, (default=True)
411411
The output of a singular value decomposition is only unique up to a
412412
permutation of the signs of the singular vectors. If `flip_sign` is
413413
set to `True`, the sign ambiguity is resolved by making the largest

sklearn/utils/sparsefuncs.py

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -72,10 +72,9 @@ def mean_variance_axis(X, axis, ddof=0):
7272
axis : int (either 0 or 1)
7373
Axis along which the axis should be computed.
7474
75-
ddof : int, optional
75+
ddof : int, optional (default=0)
7676
“Delta Degrees of Freedom”: the divisor used in the calculation is
77-
``N - ddof``, where ``N`` represents the number of elements. By default
78-
ddof is zero.
77+
``N - ddof``, where ``N`` represents the number of elements.
7978
8079
.. versionadded:: 0.21
8180
@@ -95,7 +94,10 @@ def mean_variance_axis(X, axis, ddof=0):
9594
raise ValueError('ddof cannot be <0')
9695

9796
if ddof >= X.shape[axis]:
98-
raise ValueError('ddof must be <N')
97+
raise ValueError(
98+
'ddof=%r must be smaller than the number of samples=%r' % (
99+
ddof, X.shape[axis])
100+
)
99101

100102
if isinstance(X, sp.csr_matrix):
101103
if axis == 0:

sklearn/utils/sparsefuncs_fast.pyx

Lines changed: 4 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -63,10 +63,9 @@ def csr_mean_variance_axis0(X, ddof=0):
6363
X : CSR sparse matrix, shape (n_samples, n_features)
6464
Input data.
6565
66-
ddof : int, optional
66+
ddof : int, optional (default=0)
6767
“Delta Degrees of Freedom”: the divisor used in the calculation is
68-
``N - ddof``, where ``N`` represents the number of elements. By default
69-
ddof is zero.
68+
``N - ddof``, where ``N`` represents the number of elements.
7069
7170
.. versionadded:: 0.21
7271
@@ -156,10 +155,9 @@ def csc_mean_variance_axis0(X, ddof=0):
156155
X : CSC sparse matrix, shape (n_samples, n_features)
157156
Input data.
158157
159-
ddof : int, optional
158+
ddof : int, optional (default=0)
160159
“Delta Degrees of Freedom”: the divisor used in the calculation is
161-
``N - ddof``, where ``N`` represents the number of elements. By default
162-
ddof is zero.
160+
``N - ddof``, where ``N`` represents the number of elements.
163161
164162
.. versionadded:: 0.21
165163

sklearn/utils/tests/test_sparsefuncs.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -116,7 +116,8 @@ def test_mean_variance_too_large_ddof():
116116
X, _ = make_classification(5, 4, random_state=0)
117117
X = sp.csr_matrix(X)
118118

119-
with pytest.raises(ValueError, match='ddof must be <N'):
119+
with pytest.raises(ValueError, match='ddof=10 must be smaller than the '
120+
'number of samples=5'):
120121
mean_variance_axis(X, axis=0, ddof=10)
121122

122123

0 commit comments

Comments (0)