normalized param deprecated + test fixed · scikit-learn/scikit-learn@682b219 · GitHub

Commit 682b219

Author: giorgiop

normalized param deprecated + test fixed

1 parent: e8d2b93 · commit: 682b219

File tree: 2 files changed, +167 −51 lines

sklearn/linear_model/base.py

Lines changed: 120 additions & 30 deletions
@@ -34,13 +34,10 @@
 from ..utils.seq_dataset import ArrayDataset, CSRDataset


-###
-### TODO: intercept for all models
-### We should define a common function to center data instead of
-### repeating the same code inside each fit method.
+# TODO: intercept for all models

-### TODO: bayesian_ridge_regression and bayesian_regression_ard
-### should be squashed into its respective objects.
+# TODO: bayesian_ridge_regression and bayesian_regression_ard
+# should be squashed into its respective objects.

 SPARSE_INTERCEPT_DECAY = 0.01
 # For sparse data intercept updates are scaled by this decay factor to avoid
@@ -69,12 +66,9 @@ def make_dataset(X, y, sample_weight, random_state=None):
     return dataset, intercept_decay


-def sparse_center_data(X, y, fit_intercept, normalize=False):
-    """
-    Compute information needed to center data to have mean zero along
-    axis 0. Be aware that X will not be centered since it would break
-    the sparsity, but will be normalized if asked so.
-    """
+# TODO: this reproduces the behavior prior 0.17
+# Must be remove in 0.19
+def _sparse_center_data(X, y, fit_intercept, normalize=None):
     if fit_intercept:
         # we might require not to change the csr matrix sometimes
         # store a copy if normalize is True.
@@ -106,15 +100,96 @@ def sparse_center_data(X, y, fit_intercept, normalize=False):
     return X, y, X_mean, y_mean, X_std


-def center_data(X, y, fit_intercept, normalize=False, copy=True,
-                sample_weight=None):
+def sparse_center_data(X, y, fit_intercept, standardize=False,
+                       normalize=None):
+    """
+    Compute information needed to center data to have mean zero along
+    axis 0. Be aware that X will not be centered since it would break
+    the sparsity, but will be standardized if asked so.
+    """
+    if normalize is not None:
+        warnings.warn("The `normalize` parameter is not in use anymore from "
+                      "version 0.17 and will be removed in 0.19. If you want "
+                      "to standardize the data instead, use"
+                      "`standardize=True`", DeprecationWarning)
+        return _sparse_center_data(X, y, fit_intercept, normalize)
+
+    if fit_intercept:
+        # we might require not to change the csr matrix sometimes
+        # store a copy if standardize is True.
+        # Change dtype to float64 since mean_variance_axis accepts
+        # it that way.
+        if sp.isspmatrix(X) and X.getformat() == 'csr':
+            X = sp.csr_matrix(X, copy=standardize, dtype=np.float64)
+        else:
+            X = sp.csc_matrix(X, copy=standardize, dtype=np.float64)
+
+        X_mean, X_var = mean_variance_axis(X, axis=0)
+        if standardize:
+            # transform variance to std in-place
+            X_std = np.sqrt(X_var, X_var)
+            del X_var
+            X_std[X_std == 0] = 1
+            inplace_column_scale(X, 1. / X_std)
+        else:
+            X_std = np.ones(X.shape[1])
+        y_mean = y.mean(axis=0)
+        y = y - y_mean
+    else:
+        X_mean = np.zeros(X.shape[1])
+        X_std = np.ones(X.shape[1])
+        y_mean = 0. if y.ndim == 1 else np.zeros(y.shape[1], dtype=X.dtype)
+
+    return X, y, X_mean, y_mean, X_std
+
+
+# TODO: this reproduces the behavior prior 0.17
+# Must be remove in 0.19
+def _center_data(X, y, fit_intercept, normalize=False, copy=True,
+                 sample_weight=None):
+
+    X = as_float_array(X, copy)
+    if fit_intercept:
+        if isinstance(sample_weight, numbers.Number):
+            sample_weight = None
+        if sp.issparse(X):
+            X_mean = np.zeros(X.shape[1])
+            X_std = np.ones(X.shape[1])
+        else:
+            X_mean = np.average(X, axis=0, weights=sample_weight)
+            X -= X_mean
+            if normalize:
+                # XXX: currently scaled to variance=n_samples
+                X_std = np.sqrt(np.sum(X ** 2, axis=0))
+                X_std[X_std == 0] = 1
+                X /= X_std
+            else:
+                X_std = np.ones(X.shape[1])
+        y_mean = np.average(y, axis=0, weights=sample_weight)
+        y = y - y_mean
+    else:
+        X_mean = np.zeros(X.shape[1])
+        X_std = np.ones(X.shape[1])
+        y_mean = 0. if y.ndim == 1 else np.zeros(y.shape[1], dtype=X.dtype)
+    return X, y, X_mean, y_mean, X_std
+
+
+def center_data(X, y, fit_intercept, standardize=False, normalize=None,
+                copy=True, sample_weight=None):
     """
     Centers data to have mean zero along axis 0. This is here because
     nearly all linear models will want their data to be centered.

     If sample_weight is not None, then the weighted mean of X and y
     is zero, and not the mean itself
     """
+    if normalize is not None:
+        warnings.warn("The `normalize` parameter is not in use anymore from "
+                      "version 0.17 and will be removed in 0.19. If you want "
+                      "to standardize the data instead, use"
+                      "`standardize=True`", DeprecationWarning)
+        return _center_data(X, y, fit_intercept, normalize, copy, sample_weight)
+
     X = as_float_array(X, copy)
     if fit_intercept:
         if isinstance(sample_weight, numbers.Number):
@@ -125,9 +200,8 @@ def center_data(X, y, fit_intercept, normalize=False, copy=True,
         else:
             X_mean = np.average(X, axis=0, weights=sample_weight)
             X -= X_mean
-            if normalize:
-                # XXX: currently scaled to variance=n_samples
-                X_std = np.sqrt(np.sum(X ** 2, axis=0))
+            if standardize:
+                X_std = np.sqrt(np.mean(X ** 2, axis=0))
                 X_std[X_std == 0] = 1
                 X /= X_std
             else:
@@ -356,8 +430,8 @@ class LinearRegression(LinearModel, RegressorMixin):
         to false, no intercept will be used in calculations
         (e.g. data is expected to be already centered).

-    normalize : boolean, optional, default False
-        If True, the regressors X will be normalized before regression.
+    standardize : boolean, optional, default False
+        If True, the regressors X will be standardized before regression.

     copy_X : boolean, optional, default True
         If True, X will be copied; else, it may be overwritten.
@@ -385,13 +459,26 @@ class LinearRegression(LinearModel, RegressorMixin):

     """

-    def __init__(self, fit_intercept=True, normalize=False, copy_X=True,
-                 n_jobs=1):
+    def __init__(self, fit_intercept=True, standardize=False, normalize=None,
+                 copy_X=True, n_jobs=1):
+        if normalize is not None:
+            warnings.warn("The `normalize` parameter is not in use anymore "
+                          "from version 0.17 and will be removed in 0.19. If "
+                          "you want the data to be standardized instead, use "
+                          "`standardize=True`", DeprecationWarning)
         self.fit_intercept = fit_intercept
-        self.normalize = normalize
+        self.standardize = standardize
         self.copy_X = copy_X
         self.n_jobs = n_jobs

+    @property
+    @deprecated("The `normalize` attribute is not in use anymore "
+                "from version 0.17 and will be removed in 0.19. If "
+                "you want the data to be standardized instead, use "
+                "`standardize=True`")
+    def normalize(self):
+        return None
+
     def fit(self, X, y, sample_weight=None):
         """
         Fit linear model.
@@ -416,11 +503,13 @@ def fit(self, X, y, sample_weight=None):
         X, y = check_X_y(X, y, accept_sparse=['csr', 'csc', 'coo'],
                          y_numeric=True, multi_output=True)

-        if ((sample_weight is not None) and np.atleast_1d(sample_weight).ndim > 1):
+        if ((sample_weight is not None) and
+                np.atleast_1d(sample_weight).ndim > 1):
             sample_weight = column_or_1d(sample_weight, warn=True)

         X, y, X_mean, y_mean, X_std = self._center_data(
-            X, y, self.fit_intercept, self.normalize, self.copy_X,
+            X, y, fit_intercept=self.fit_intercept,
+            standardize=self.standardize, copy=self.copy_X,
             sample_weight=sample_weight)

         if sample_weight is not None:
@@ -450,24 +539,25 @@ def fit(self, X, y, sample_weight=None):
         return self


-def _pre_fit(X, y, Xy, precompute, normalize, fit_intercept, copy):
+def _pre_fit(X, y, Xy, precompute, standardize, fit_intercept, copy):
     """Aux function used at beginning of fit in linear models"""
     n_samples, n_features = X.shape

     if sparse.isspmatrix(X):
         precompute = False
         X, y, X_mean, y_mean, X_std = sparse_center_data(
-            X, y, fit_intercept, normalize)
+            X, y, fit_intercept=fit_intercept, standardize=standardize)
     else:
         # copy was done in fit if necessary
         X, y, X_mean, y_mean, X_std = center_data(
-            X, y, fit_intercept, normalize, copy=copy)
+            X, y, fit_intercept=fit_intercept, standardize=standardize,
+            copy=copy)
     if hasattr(precompute, '__array__') and (
-        fit_intercept and not np.allclose(X_mean, np.zeros(n_features))
-        or normalize and not np.allclose(X_std, np.ones(n_features))):
+            fit_intercept and not np.allclose(X_mean, np.zeros(n_features)) or
+            standardize and not np.allclose(X_std, np.ones(n_features))):
         warnings.warn("Gram matrix was provided but X was centered"
                       " to fit intercept, "
-                      "or X was normalized : recomputing Gram matrix.",
+                      "or X was standardized : recomputing Gram matrix.",
                       UserWarning)
         # recompute Gram
         precompute = 'auto'
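
In short, center_data and sparse_center_data gain a `standardize` flag that divides each centered column by its standard deviation, while passing the old `normalize` keyword only emits a DeprecationWarning and delegates to the private pre-0.17 helpers. A minimal sketch of both call paths, assuming this branch of scikit-learn (the `standardize` parameter exists only in this commit and is not part of any released scikit-learn API):

import warnings

import numpy as np

from sklearn.linear_model.base import center_data

X = np.array([[1.0, 10.0],
              [2.0, 20.0],
              [3.0, 30.0]])
y = np.array([1.0, 2.0, 3.0])

# New spelling: after centering, each column is divided by its standard
# deviation, so X_std equals np.std(X, axis=0).
Xt, yt, X_mean, y_mean, X_std = center_data(X, y, fit_intercept=True,
                                            standardize=True)
np.testing.assert_allclose(X_std, np.std(X, axis=0))

# Old spelling: still accepted, but it warns and falls back to _center_data,
# which keeps the pre-0.17 scaling (columns divided by
# sqrt(sum(x_centered ** 2)), i.e. "variance = n_samples").
with warnings.catch_warnings(record=True) as caught:
    warnings.simplefilter("always")
    _, _, _, _, X_std_old = center_data(X, y, fit_intercept=True,
                                        normalize=True)
assert any(issubclass(w.category, DeprecationWarning) for w in caught)
np.testing.assert_allclose(X_std_old, np.std(X, axis=0) * np.sqrt(len(X)))

The last assertion makes the behavioral difference explicit: the deprecated path still scales columns to "variance = n_samples" rather than to unit variance.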

sklearn/linear_model/tests/test_base.py

Lines changed: 47 additions & 21 deletions
@@ -8,11 +8,14 @@

 from sklearn.utils.testing import assert_array_almost_equal
 from sklearn.utils.testing import assert_equal
+from sklearn.utils.testing import assert_warns
+from sklearn.utils.testing import ignore_warnings

 from sklearn.linear_model.base import LinearRegression
-from sklearn.linear_model.base import center_data, sparse_center_data, _rescale_data
+from sklearn.linear_model.base import center_data
+from sklearn.linear_model.base import sparse_center_data
+from sklearn.linear_model.base import _rescale_data
 from sklearn.utils import check_random_state
-from sklearn.utils.testing import assert_raise_message
 from sklearn.utils.testing import assert_greater
 from sklearn.datasets.samples_generator import make_sparse_uncorrelated
 from sklearn.datasets.samples_generator import make_regression
@@ -168,28 +171,35 @@ def test_center_data():
     X = rng.rand(n_samples, n_features)
     y = rng.rand(n_samples)
     expected_X_mean = np.mean(X, axis=0)
-    # XXX: currently scaled to variance=n_samples
-    expected_X_std = np.std(X, axis=0) * np.sqrt(X.shape[0])
+    expected_X_std = np.std(X, axis=0)
     expected_y_mean = np.mean(y, axis=0)

     Xt, yt, X_mean, y_mean, X_std = center_data(X, y, fit_intercept=False,
-                                                normalize=False)
+                                                standardize=False)
     assert_array_almost_equal(X_mean, np.zeros(n_features))
     assert_array_almost_equal(y_mean, 0)
     assert_array_almost_equal(X_std, np.ones(n_features))
     assert_array_almost_equal(Xt, X)
     assert_array_almost_equal(yt, y)

     Xt, yt, X_mean, y_mean, X_std = center_data(X, y, fit_intercept=True,
-                                                normalize=False)
+                                                standardize=False)
     assert_array_almost_equal(X_mean, expected_X_mean)
     assert_array_almost_equal(y_mean, expected_y_mean)
     assert_array_almost_equal(X_std, np.ones(n_features))
     assert_array_almost_equal(Xt, X - expected_X_mean)
     assert_array_almost_equal(yt, y - expected_y_mean)

+    Xt, yt, X_mean, y_mean, X_std = center_data(X, y, fit_intercept=False,
+                                                standardize=True)
+    assert_array_almost_equal(X_mean, np.zeros(n_features))
+    assert_array_almost_equal(y_mean, 0)
+    assert_array_almost_equal(X_std, np.ones(n_features))
+    assert_array_almost_equal(Xt, X)
+    assert_array_almost_equal(yt, y)
+
     Xt, yt, X_mean, y_mean, X_std = center_data(X, y, fit_intercept=True,
-                                                normalize=True)
+                                                standardize=True)
     assert_array_almost_equal(X_mean, expected_X_mean)
     assert_array_almost_equal(y_mean, expected_y_mean)
     assert_array_almost_equal(X_std, expected_X_std)
@@ -209,17 +219,17 @@ def test_center_data_multioutput():
     args = [(center_data, X), (sparse_center_data, sparse.csc_matrix(X))]
     for center, X in args:
         _, yt, _, y_mean, _ = center(X, y, fit_intercept=False,
-                                     normalize=False)
+                                     standardize=False)
         assert_array_almost_equal(y_mean, np.zeros(n_outputs))
         assert_array_almost_equal(yt, y)

         _, yt, _, y_mean, _ = center(X, y, fit_intercept=True,
-                                     normalize=False)
+                                     standardize=False)
         assert_array_almost_equal(y_mean, expected_y_mean)
         assert_array_almost_equal(yt, y - y_mean)

         _, yt, _, y_mean, _ = center(X, y, fit_intercept=True,
-                                     normalize=True)
+                                     standardize=True)
         assert_array_almost_equal(y_mean, expected_y_mean)
         assert_array_almost_equal(yt, y - y_mean)

@@ -234,14 +244,12 @@ def test_center_data_weighted():
     expected_X_mean = np.average(X, axis=0, weights=sample_weight)
     expected_y_mean = np.average(y, axis=0, weights=sample_weight)

-    # XXX: if normalize=True, should we expect a weighted standard deviation?
+    # XXX: if standardize=True, should we expect a weighted standard deviation?
     # Currently not weighted, but calculated with respect to weighted mean
-    # XXX: currently scaled to variance=n_samples
-    expected_X_std = (np.sqrt(X.shape[0]) *
-                      np.mean((X - expected_X_mean) ** 2, axis=0) ** .5)
+    expected_X_std = (np.mean((X - expected_X_mean) ** 2, axis=0) ** .5)

     Xt, yt, X_mean, y_mean, X_std = center_data(X, y, fit_intercept=True,
-                                                normalize=False,
+                                                standardize=False,
                                                 sample_weight=sample_weight)
     assert_array_almost_equal(X_mean, expected_X_mean)
     assert_array_almost_equal(y_mean, expected_y_mean)
@@ -250,7 +258,7 @@ def test_center_data_weighted():
     assert_array_almost_equal(yt, y - expected_y_mean)

     Xt, yt, X_mean, y_mean, X_std = center_data(X, y, fit_intercept=True,
-                                                normalize=True,
+                                                standardize=True,
                                                 sample_weight=sample_weight)
     assert_array_almost_equal(X_mean, expected_X_mean)
     assert_array_almost_equal(y_mean, expected_y_mean)
@@ -268,12 +276,11 @@ def test_sparse_center_data():
     X = X.tolil()
     y = rng.rand(n_samples)
     XA = X.toarray()
-    # XXX: currently scaled to variance=n_samples
-    expected_X_std = np.std(XA, axis=0) * np.sqrt(X.shape[0])
+    expected_X_std = np.std(XA, axis=0)

     Xt, yt, X_mean, y_mean, X_std = sparse_center_data(X, y,
                                                        fit_intercept=False,
-                                                       normalize=False)
+                                                       standardize=False)
     assert_array_almost_equal(X_mean, np.zeros(n_features))
     assert_array_almost_equal(y_mean, 0)
     assert_array_almost_equal(X_std, np.ones(n_features))
@@ -282,7 +289,7 @@ def test_sparse_center_data():

     Xt, yt, X_mean, y_mean, X_std = sparse_center_data(X, y,
                                                        fit_intercept=True,
-                                                       normalize=False)
+                                                       standardize=False)
     assert_array_almost_equal(X_mean, np.mean(XA, axis=0))
     assert_array_almost_equal(y_mean, np.mean(y, axis=0))
     assert_array_almost_equal(X_std, np.ones(n_features))
@@ -291,7 +298,7 @@ def test_sparse_center_data():

     Xt, yt, X_mean, y_mean, X_std = sparse_center_data(X, y,
                                                        fit_intercept=True,
-                                                       normalize=True)
+                                                       standardize=True)
     assert_array_almost_equal(X_mean, np.mean(XA, axis=0))
     assert_array_almost_equal(y_mean, np.mean(y, axis=0))
     assert_array_almost_equal(X_std, expected_X_std)
@@ -322,3 +329,22 @@ def test_rescale_data():
     assert_array_almost_equal(rescaled_X, rescaled_X2)
     assert_array_almost_equal(rescaled_y, rescaled_y2)

+
+@ignore_warnings
+def test_normalize_deprecation():
+    X = np.array([[1], [2]])
+    y = np.array([1, 2])
+    X_csr = sparse.csr_matrix(X)
+
+    assert_warns(DeprecationWarning, center_data, X, y, True, normalize=True)
+    assert_warns(DeprecationWarning, sparse_center_data, X_csr, y, True,
+                 normalize=True)
+    assert_warns(DeprecationWarning, LinearRegression, normalize=True)
+
+    # Test warning when accessing the normalize attribute
+    est = LinearRegression(normalize=True)
+
+    def trigger_warning_for_property(estimator):
+        est.normalize
+
+    assert_warns(DeprecationWarning, trigger_warning_for_property, est)
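
The new test_normalize_deprecation above checks these warnings with assert_warns. As a usage-level sketch of the same behavior at the estimator level, again assuming this branch (released scikit-learn has neither a `standardize` constructor argument nor a deprecated `normalize` property on LinearRegression):

import warnings

from sklearn.linear_model import LinearRegression

# Preferred spelling on this branch.
est = LinearRegression(standardize=True)
assert est.standardize is True

# The old keyword still constructs a working estimator but emits a warning;
# the value is discarded, and `normalize` itself is now a deprecated
# read-only property that returns None.
with warnings.catch_warnings(record=True) as caught:
    warnings.simplefilter("always")
    old_style = LinearRegression(normalize=True)
    _ = old_style.normalize  # accessing the deprecated property also warns
assert sum(issubclass(w.category, DeprecationWarning) for w in caught) >= 2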

0 commit comments
