gio8tisu
diff --git a/‎doc/whats_new/v0.23.rst
Lines changed: 12 additions & 8 deletions b/‎doc/whats_new/v0.23.rst
Lines changed: 12 additions & 8 deletions
diff --git a/‎sklearn/compose/tests/test_target.py
Lines changed: 2 additions & 2 deletions b/‎sklearn/compose/tests/test_target.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎sklearn/linear_model/_base.py
Lines changed: 26 additions & 7 deletions b/‎sklearn/linear_model/_base.py
Lines changed: 26 additions & 7 deletions
diff --git a/‎sklearn/linear_model/_coordinate_descent.py
Lines changed: 87 additions & 7 deletions b/‎sklearn/linear_model/_coordinate_descent.py
Lines changed: 87 additions & 7 deletions
diff --git a/‎sklearn/linear_model/tests/test_base.py
Lines changed: 13 additions & 6 deletions b/‎sklearn/linear_model/tests/test_base.py
Lines changed: 13 additions & 6 deletions
@@ -54,10 +54,10 @@ Changelog
   ``tol=0`` as with the default ``algorithm="full"``. :pr:`16075` by
   :user:`Erich Schubert <kno10>`.
 
-- |Efficiency| :class:`cluster.Birch` implementation of the predict method 
-  avoids high memory footprint by calculating the distances matrix using 
+- |Efficiency| :class:`cluster.Birch` implementation of the predict method
+  avoids high memory footprint by calculating the distances matrix using
   a chunked scheme.
-  :pr:`16149` by :user:`Jeremie du Boisberranger <jeremiedbb>` and 
+  :pr:`16149` by :user:`Jeremie du Boisberranger <jeremiedbb>` and
   :user:`Alex Shacked <alexshacked>`.
 
 :mod:`sklearn.compose`
@@ -70,7 +70,7 @@ Changelog
 :mod:`sklearn.datasets`
 .......................
 
-- |Enhancement| Added ``return_centers`` parameter  in  
+- |Enhancement| Added ``return_centers`` parameter  in
   :func:`datasets.make_blobs`, which can be used to return
   centers for each cluster.
   :pr:`15709` by :user:`<shivamgargsya>` and
@@ -154,10 +154,14 @@ Changelog
 
 - |Enhancement| :func:`gaussian_process.kernels.Matern` returns the RBF kernel when ``nu=np.inf``.
   :pr:`15503` by :user:`Sam Dixon <sam-dixon>`.
-  
+
 :mod:`sklearn.linear_model`
 ...........................
 
+- |Feature| Support of `sample_weight` in :class:`linear_model.ElasticNet` and
+  :class:`linear_model.Lasso` for dense feature matrix `X`.
+  :pr:`15436` by :user:`Christian Lorentzen <lorentzenchr>`.
+
 - |Fix| Fixed a bug where if a `sample_weight` parameter was passed to the fit
   method of :class:`linear_model.RANSACRegressor`, it would not be passed to
   the wrapped `base_estimator` during the fitting of the final model.
@@ -196,7 +200,7 @@ Changelog
 ......................
 
 - |Fix| Fixed a bug in :func:`metrics.mean_squared_error` to not ignore
-  argument `squared` when argument `multioutput='raw_values'`. 
+  argument `squared` when argument `multioutput='raw_values'`.
   :pr:`16323` by :user:`Rushabh Vasani <rushabh-v>`
 
 - |Fix| Fixed a bug in :func:`metrics.mutual_info_score` where negative
@@ -230,10 +234,10 @@ Changelog
 :mod:`sklearn.neighbors`
 ..............................
 
-- |Fix| Fix a bug which converted a list of arrays into a 2-D object 
+- |Fix| Fix a bug which converted a list of arrays into a 2-D object
   array instead of a 1-D array containing NumPy arrays. This bug
   was affecting :meth:`neighbors.NearestNeighbors.radius_neighbors`.
-  :pr:`16076` by :user:`Guillaume Lemaitre <glemaitre>` and  
+  :pr:`16076` by :user:`Guillaume Lemaitre <glemaitre>` and
   :user:`Alex Shacked <alexshacked>`.
 
 :mod:`sklearn.neural_network`
 
@@ -16,7 +16,7 @@
 
 from sklearn.pipeline import Pipeline
 
-from sklearn.linear_model import LinearRegression, Lasso
+from sklearn.linear_model import LinearRegression, OrthogonalMatchingPursuit
 
 from sklearn import datasets
 
@@ -37,7 +37,7 @@ def test_transform_target_regressor_error():
         regr.fit(X, y)
     # fit with sample_weight with a regressor which does not support it
     sample_weight = np.ones((y.shape[0],))
-    regr = TransformedTargetRegressor(regressor=Lasso(),
+    regr = TransformedTargetRegressor(regressor=OrthogonalMatchingPursuit(),
                                       transformer=StandardScaler())
     with pytest.raises(TypeError, match=r"fit\(\) got an unexpected "
                        "keyword argument 'sample_weight'"):
 
@@ -1,5 +1,5 @@
 """
-Generalized Linear models.
+Generalized Linear Models.
 """
 
 # Author: Alexandre Gramfort <alexandre.gramfort@inria.fr>
@@ -100,7 +100,8 @@ def make_dataset(X, y, sample_weight, random_state=None):
 
 def _preprocess_data(X, y, fit_intercept, normalize=False, copy=True,
                      sample_weight=None, return_mean=False, check_input=True):
-    """
+    """Center and scale data.
+
     Centers data to have mean zero along axis 0. If fit_intercept=False or if
     the X is a sparse matrix, no centering is done, but normalization can still
     be applied. The function returns the statistics necessary to reconstruct
@@ -180,7 +181,16 @@ def _preprocess_data(X, y, fit_intercept, normalize=False, copy=True,
 # sample_weight makes the refactoring tricky.
 
 def _rescale_data(X, y, sample_weight):
-    """Rescale data so as to support sample_weight"""
+    """Rescale data sample-wise by square root of sample_weight.
+
+    For many linear models, this enables easy support for sample_weight.
+
+    Returns
+    -------
+    X_rescaled : {array-like, sparse matrix}
+
+    y_rescaled : {array-like, sparse matrix}
+    """
     n_samples = X.shape[0]
     sample_weight = np.asarray(sample_weight)
     if sample_weight.ndim == 0:
@@ -540,8 +550,15 @@ def rmatvec(b):
 
 
 def _pre_fit(X, y, Xy, precompute, normalize, fit_intercept, copy,
-             check_input=True):
-    """Aux function used at beginning of fit in linear models"""
+             check_input=True, sample_weight=None):
+    """Aux function used at beginning of fit in linear models
+
+    Parameters
+    ----------
+    sample_weight : array-like or None, default=None
+        Passed on to _preprocess_data. If not None, X and y are additionally
+        rescaled with _rescale_data.
+    """
     n_samples, n_features = X.shape
 
     if sparse.isspmatrix(X):
@@ -554,9 +571,11 @@ def _pre_fit(X, y, Xy, precompute, normalize, fit_intercept, copy,
         # copy was done in fit if necessary
         X, y, X_offset, y_offset, X_scale = _preprocess_data(
             X, y, fit_intercept=fit_intercept, normalize=normalize, copy=copy,
-            check_input=check_input)
+            check_input=check_input, sample_weight=sample_weight)
+    if sample_weight is not None:
+        X, y = _rescale_data(X, y, sample_weight=sample_weight)
     if hasattr(precompute, '__array__') and (
-            fit_intercept and not np.allclose(X_offset, np.zeros(n_features)) or
+        fit_intercept and not np.allclose(X_offset, np.zeros(n_features)) or
             normalize and not np.allclose(X_scale, np.ones(n_features))):
         warnings.warn("Gram matrix was provided but X was centered"
                       " to fit intercept, "
 
@@ -7,6 +7,7 @@
 
 import sys
 import warnings
+import numbers
 from abc import ABCMeta, abstractmethod
 
 import numpy as np
@@ -20,13 +21,57 @@
 from ..utils.validation import check_random_state
 from ..model_selection import check_cv
 from ..utils.extmath import safe_sparse_dot
-from ..utils.fixes import _joblib_parallel_args
-from ..utils.validation import check_is_fitted
+from ..utils.fixes import _astype_copy_false, _joblib_parallel_args
+from ..utils.validation import check_is_fitted, _check_sample_weight
 from ..utils.validation import column_or_1d
 
 from . import _cd_fast as cd_fast
 
 
+def _set_order(X, y, order='C'):
+    """Change the order of X and y if necessary.
+
+    Parameters
+    ----------
+    X : {array-like, sparse matrix} of shape (n_samples, n_features)
+        Training data.
+
+    y : ndarray of shape (n_samples,)
+        Target values.
+
+    order : {None, 'C', 'F'}, default='C'
+        If 'C', dense arrays are returned as C-ordered, sparse matrices in csr
+        format. If 'F', dense arrays are returned as F-ordered, sparse matrices
+        in csc format.
+
+    Returns
+    -------
+    X : {array-like, sparse matrix} of shape (n_samples, n_features)
+        Training data with guaranteed order.
+
+    y : ndarray of shape (n_samples,)
+        Target values with guaranteed order.
+    """
+    if order not in [None, 'C', 'F']:
+        raise ValueError("Unknown value for order. Got {} instead of "
+                         "None, 'C' or 'F'.".format(order))
+    sparse_X = sparse.issparse(X)
+    sparse_y = sparse.issparse(y)
+    if order is not None:
+        sparse_format = "csc" if order == "F" else "csr"
+        if sparse_X:
+            # As of scipy 1.1.0, new argument copy=False by default.
+            # This is what we want.
+            X = X.asformat(sparse_format, **_astype_copy_false(X))
+        else:
+            X = np.asarray(X, order=order)
+        if sparse_y:
+            y = y.asformat(sparse_format)
+        else:
+            y = np.asarray(y, order=order)
+    return X, y
+
+
 ###############################################################################
 # Paths functions
 
@@ -661,7 +706,7 @@ def __init__(self, alpha=1.0, l1_ratio=0.5, fit_intercept=True,
         self.random_state = random_state
         self.selection = selection
 
-    def fit(self, X, y, check_input=True):
+    def fit(self, X, y, sample_weight=None, check_input=True):
         """Fit model with coordinate descent.
 
         Parameters
@@ -673,6 +718,9 @@ def fit(self, X, y, check_input=True):
             (n_samples, n_targets)
             Target. Will be cast to X's dtype if necessary
 
+        sample_weight : float or array-like of shape (n_samples,), default=None
+            Sample weight.
+
         check_input : bool, default=True
             Allow to bypass several input checking.
             Don't use this parameter unless you know what you do.
@@ -709,18 +757,49 @@ def fit(self, X, y, check_input=True):
             y = check_array(y, order='F', copy=False, dtype=X.dtype.type,
                             ensure_2d=False)
 
-        # Ensure copying happens only once, don't do it again if done above
+        n_samples, n_features = X.shape
+        alpha = self.alpha
+
+        if isinstance(sample_weight, numbers.Number):
+            sample_weight = None
+        if sample_weight is not None:
+            if check_input:
+                if sparse.issparse(X):
+                    raise ValueError("Sample weights do not (yet) support "
+                                     "sparse matrices.")
+                sample_weight = _check_sample_weight(sample_weight, X,
+                                                     dtype=X.dtype)
+            # simplify things by rescaling sw to sum up to n_samples
+            # => np.average(x, weights=sw) = np.mean(sw * x)
+            sample_weight *= (n_samples / np.sum(sample_weight))
+            # Objective function is:
+            # 1/2 * np.average(squared error, weights=sw) + alpha * penalty
+            # but coordinate descent minimizes:
+            # 1/2 * sum(squared error) + alpha * penalty
+            # enet_path therefore sets alpha = n_samples * alpha
+            # With sw, enet_path should set alpha = sum(sw) * alpha
+            # Therefore, we rescale alpha = sum(sw) / n_samples * alpha
+            # Note: As we rescaled sample_weights to sum up to n_samples,
+            #       we don't need this
+            # alpha *= np.sum(sample_weight) / n_samples
+
+        # Ensure copying happens only once, don't do it again if done above.
+        # X and y will be rescaled if sample_weight is not None; the
+        # _set_order call after _pre_fit makes them F-contiguous again.
         should_copy = self.copy_X and not X_copied
         X, y, X_offset, y_offset, X_scale, precompute, Xy = \
             _pre_fit(X, y, None, self.precompute, self.normalize,
                      self.fit_intercept, copy=should_copy,
-                     check_input=check_input)
+                     check_input=check_input, sample_weight=sample_weight)
+        # coordinate descent needs F-ordered arrays and _pre_fit might have
+        # called _rescale_data
+        if check_input or sample_weight is not None:
+            X, y = _set_order(X, y, order='F')
         if y.ndim == 1:
             y = y[:, np.newaxis]
         if Xy is not None and Xy.ndim == 1:
             Xy = Xy[:, np.newaxis]
 
-        n_samples, n_features = X.shape
         n_targets = y.shape[1]
 
         if self.selection not in ['cyclic', 'random']:
@@ -745,7 +824,7 @@ def fit(self, X, y, check_input=True):
             _, this_coef, this_dual_gap, this_iter = \
                 self.path(X, y[:, k],
                           l1_ratio=self.l1_ratio, eps=None,
-                          n_alphas=None, alphas=[self.alpha],
+                          n_alphas=None, alphas=[alpha],
                           precompute=precompute, Xy=this_Xy,
                           fit_intercept=False, normalize=False, copy_X=True,
                           verbose=False, tol=self.tol, positive=self.positive,
@@ -1397,6 +1476,7 @@ def __init__(self, eps=1e-3, n_alphas=100, alphas=None, fit_intercept=True,
     def _more_tags(self):
         return {'multioutput': False}
 
+
 class ElasticNetCV(RegressorMixin, LinearModelCV):
     """Elastic Net model with iterative fitting along a regularization path.
 
 
@@ -131,11 +131,11 @@ def test_fit_intercept():
     lr3_with_intercept = LinearRegression().fit(X3, y)
 
     assert (lr2_with_intercept.coef_.shape ==
-                 lr2_without_intercept.coef_.shape)
+            lr2_without_intercept.coef_.shape)
     assert (lr3_with_intercept.coef_.shape ==
-                 lr3_without_intercept.coef_.shape)
+            lr3_without_intercept.coef_.shape)
     assert (lr2_without_intercept.coef_.ndim ==
-                 lr3_without_intercept.coef_.ndim)
+            lr3_without_intercept.coef_.ndim)
 
 
 def test_linear_regression_sparse(random_state=0):
@@ -451,16 +451,23 @@ def test_dtype_preprocess_data():
             assert_array_almost_equal(X_norm_32, X_norm_64)
 
 
-def test_rescale_data():
+@pytest.mark.parametrize('n_targets', [None, 2])
+def test_rescale_data_dense(n_targets):
     n_samples = 200
     n_features = 2
 
     sample_weight = 1.0 + rng.rand(n_samples)
     X = rng.rand(n_samples, n_features)
-    y = rng.rand(n_samples)
+    if n_targets is None:
+        y = rng.rand(n_samples)
+    else:
+        y = rng.rand(n_samples, n_targets)
     rescaled_X, rescaled_y = _rescale_data(X, y, sample_weight)
     rescaled_X2 = X * np.sqrt(sample_weight)[:, np.newaxis]
-    rescaled_y2 = y * np.sqrt(sample_weight)
+    if n_targets is None:
+        rescaled_y2 = y * np.sqrt(sample_weight)
+    else:
+        rescaled_y2 = y * np.sqrt(sample_weight)[:, np.newaxis]
     assert_array_almost_equal(rescaled_X, rescaled_X2)
     assert_array_almost_equal(rescaled_y, rescaled_y2)