FEA Add Nonnegative LinearRegression (#17578) · sstalley/scikit-learn@075d424 · GitHub

Commit 075d424

cmarmo, NicolasHug, and jknox13 authored
FEA Add Nonnegative LinearRegression (scikit-learn#17578)
Co-authored-by: Nicolas Hug <contact@nicolas-hug.com>
Co-authored-by: Joseph Knox <jknox13@uw.edu>
Co-authored-by: Joseph Knox <joseph.edward.knox@gmail.com>
1 parent febdd19 commit 075d424

File tree

6 files changed: +197 −6 lines changed

doc/modules/linear_model.rst

Lines changed: 15 additions & 0 deletions
@@ -43,6 +43,8 @@ and will store the coefficients :math:`w` of the linear model in its

     >>> from sklearn import linear_model
     >>> reg = linear_model.LinearRegression()
+    >>> reg.fit ([[0, 0], [1, 1], [2, 2]], [0, 1, 2])
+    LinearRegression()
     >>> reg.fit([[0, 0], [1, 1], [2, 2]], [0, 1, 2])
     LinearRegression()
     >>> reg.coef_
@@ -61,6 +63,19 @@ example, when data are collected without an experimental design.

 * :ref:`sphx_glr_auto_examples_linear_model_plot_ols.py`

+Non-Negative Least Squares
+--------------------------
+
+It is possible to constrain all the coefficients to be non-negative, which may
+be useful when they represent some physical or naturally non-negative
+quantities (e.g., frequency counts or prices of goods).
+:class:`LinearRegression` accepts a boolean ``positive``
+parameter: when set to ``True``, `Non-Negative Least Squares
+<https://en.wikipedia.org/wiki/Non-negative_least_squares>`_ are then applied.
+
+.. topic:: Examples:
+
+   * :ref:`sphx_glr_auto_examples_linear_model_plot_nnls.py`

 Ordinary Least Squares Complexity
 ---------------------------------
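
Since the new ``positive`` option simply routes the fit through SciPy's NNLS solver (see the implementation diff in sklearn/linear_model/_base.py below), the two should agree exactly on dense, single-output problems when no intercept is fit. A minimal sketch, not part of the commit, assuming a scikit-learn version that includes this feature:

    import numpy as np
    from scipy import optimize
    from sklearn.linear_model import LinearRegression

    rng = np.random.RandomState(0)
    X = rng.rand(100, 5)
    y = X @ np.array([1.0, 0.0, 2.0, 0.0, 3.0]) + 0.01 * rng.randn(100)

    # fit_intercept=False avoids centering, so the comparison with raw
    # scipy.optimize.nnls is exact
    reg = LinearRegression(positive=True, fit_intercept=False).fit(X, y)
    coef_nnls, _ = optimize.nnls(X, y)

    assert np.allclose(reg.coef_, coef_nnls)
    assert np.all(reg.coef_ >= 0)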

doc/tutorial/statistical_inference/supervised_learning.rst

Lines changed: 1 addition & 1 deletion
@@ -173,7 +173,7 @@ Linear models: :math:`y = X\beta + \epsilon`
     >>> regr = linear_model.LinearRegression()
     >>> regr.fit(diabetes_X_train, diabetes_y_train)
     LinearRegression()
-    >>> print(regr.coef_)    # doctest: +SKIP
+    >>> print(regr.coef_)
     [   0.30349955 -237.63931533  510.53060544  327.73698041 -814.13170937
       492.81458798  102.84845219  184.60648906  743.51961675   76.09517222]
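
For context, ``diabetes_X_train`` and ``diabetes_y_train`` come from earlier in that tutorial. A self-contained reproduction of the doctest above, assuming the tutorial's convention of holding out the last 20 samples:

    from sklearn import datasets, linear_model

    diabetes_X, diabetes_y = datasets.load_diabetes(return_X_y=True)
    # hold out the last 20 samples, as the tutorial does
    diabetes_X_train = diabetes_X[:-20]
    diabetes_y_train = diabetes_y[:-20]

    regr = linear_model.LinearRegression()
    regr.fit(diabetes_X_train, diabetes_y_train)
    print(regr.coef_)  # ten coefficients, one per feature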

doc/whats_new/v0.24.rst

Lines changed: 8 additions & 0 deletions
@@ -203,6 +203,14 @@ Changelog
 - |Enhancement| :class:`isotonic.IsotonicRegression` now accepts 2darray with 1 feature as
   input array. :pr:`17379` by :user:`Jiaxiang <fujiaxiang>`.

+:mod:`sklearn.linear_model`
+...........................
+
+- |Feature| :class:`linear_model.LinearRegression` now forces coefficients
+  to be all positive when ``positive`` is set to ``True``.
+  :pr:`17578` by :user:`Joseph Knox <jknox13>`, :user:`Nelle Varoquaux <NelleV>`
+  and :user:`Chiara Marmo <cmarmo>`.
+
 :mod:`sklearn.manifold`
 .......................

examples/linear_model/plot_nnls.py

Lines changed: 67 additions & 0 deletions
@@ -0,0 +1,67 @@
+"""
+==========================
+Non-negative least squares
+==========================
+
+In this example, we fit a linear model with positive constraints on the
+regression coefficients and compare the estimated coefficients to a classic
+linear regression.
+"""
+print(__doc__)
+import numpy as np
+import matplotlib.pyplot as plt
+from sklearn.metrics import r2_score
+
+# %%
+# Generate some random data
+np.random.seed(42)
+
+n_samples, n_features = 200, 50
+X = np.random.randn(n_samples, n_features)
+true_coef = 3 * np.random.randn(n_features)
+# Threshold coefficients to render them non-negative
+true_coef[true_coef < 0] = 0
+y = np.dot(X, true_coef)
+
+# Add some noise
+y += 5 * np.random.normal(size=(n_samples, ))
+
+# %%
+# Split the data in train set and test set
+from sklearn.model_selection import train_test_split
+
+X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.5)
+
+# %%
+# Fit the Non-Negative least squares.
+from sklearn.linear_model import LinearRegression
+
+reg_nnls = LinearRegression(positive=True)
+y_pred_nnls = reg_nnls.fit(X_train, y_train).predict(X_test)
+r2_score_nnls = r2_score(y_test, y_pred_nnls)
+print("NNLS R2 score", r2_score_nnls)
+
+# %%
+# Fit an OLS.
+reg_ols = LinearRegression()
+y_pred_ols = reg_ols.fit(X_train, y_train).predict(X_test)
+r2_score_ols = r2_score(y_test, y_pred_ols)
+print("OLS R2 score", r2_score_ols)
+
+
+# %%
+# Comparing the regression coefficients between OLS and NNLS, we can observe
+# they are highly correlated (the dashed line is the identity relation),
+# but the non-negative constraint shrinks some to 0.
+# The Non-Negative Least squares inherently yield sparse results.
+
+fig, ax = plt.subplots()
+ax.plot(reg_ols.coef_, reg_nnls.coef_, linewidth=0, marker=".")
+
+low_x, high_x = ax.get_xlim()
+low_y, high_y = ax.get_ylim()
+low = max(low_x, low_y)
+high = min(high_x, high_y)
+ax.plot([low, high], [low, high], ls="--", c=".3", alpha=.5)
+ax.set_xlabel("OLS regression coefficients", fontweight="bold")
+ax.set_ylabel("NNLS regression coefficients", fontweight="bold")
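
The sparsity claim in the final comment is easy to verify numerically, since NNLS is an active-set method and drives inactive coefficients to exactly zero. A hypothetical check, reusing ``true_coef`` and ``reg_nnls`` from the script above:

    # count coefficients driven exactly to 0.0 by the active-set solver
    print("zero coefficients in true_coef:", np.sum(true_coef == 0))
    print("zero coefficients in NNLS fit: ", np.sum(reg_nnls.coef_ == 0))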

sklearn/linear_model/_base.py

Lines changed: 25 additions & 4 deletions
@@ -20,6 +20,7 @@
 import numpy as np
 import scipy.sparse as sp
 from scipy import linalg
+from scipy import optimize
 from scipy import sparse
 from scipy.special import expit
 from joblib import Parallel, delayed

@@ -419,6 +420,12 @@ class LinearRegression(MultiOutputMixin, RegressorMixin, LinearModel):
         ``-1`` means using all processors. See :term:`Glossary <n_jobs>`
         for more details.

+    positive : bool, default=False
+        When set to ``True``, forces the coefficients to be positive. This
+        option is only supported for dense arrays.
+
+        .. versionadded:: 0.24
+
     Attributes
     ----------
     coef_ : array of shape (n_features, ) or (n_targets, n_features)

@@ -451,7 +458,8 @@ class LinearRegression(MultiOutputMixin, RegressorMixin, LinearModel):
     Notes
     -----
     From the implementation point of view, this is just plain Ordinary
-    Least Squares (scipy.linalg.lstsq) wrapped as a predictor object.
+    Least Squares (scipy.linalg.lstsq) or Non Negative Least Squares
+    (scipy.optimize.nnls) wrapped as a predictor object.

     Examples
     --------

@@ -472,11 +480,12 @@ class LinearRegression(MultiOutputMixin, RegressorMixin, LinearModel):
     """
     @_deprecate_positional_args
     def __init__(self, *, fit_intercept=True, normalize=False, copy_X=True,
-                 n_jobs=None):
+                 n_jobs=None, positive=False):
         self.fit_intercept = fit_intercept
         self.normalize = normalize
         self.copy_X = copy_X
         self.n_jobs = n_jobs
+        self.positive = positive

     def fit(self, X, y, sample_weight=None):
         """

@@ -502,7 +511,10 @@ def fit(self, X, y, sample_weight=None):
         """

         n_jobs_ = self.n_jobs
-        X, y = self._validate_data(X, y, accept_sparse=['csr', 'csc', 'coo'],
+
+        accept_sparse = False if self.positive else ['csr', 'csc', 'coo']
+
+        X, y = self._validate_data(X, y, accept_sparse=accept_sparse,
                                    y_numeric=True, multi_output=True)

         if sample_weight is not None:

@@ -518,7 +530,16 @@ def fit(self, X, y, sample_weight=None):
         # Sample weight can be implemented via a simple rescaling.
         X, y = _rescale_data(X, y, sample_weight)

-        if sp.issparse(X):
+        if self.positive:
+            if y.ndim < 2:
+                self.coef_, self._residues = optimize.nnls(X, y)
+            else:
+                # scipy.optimize.nnls cannot handle y with shape (M, K)
+                outs = Parallel(n_jobs=n_jobs_)(
+                    delayed(optimize.nnls)(X, y[:, j])
+                    for j in range(y.shape[1]))
+                self.coef_, self._residues = map(np.vstack, zip(*outs))
+        elif sp.issparse(X):
             X_offset_scale = X_offset / X_scale

             def matvec(b):
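
The key change in ``fit`` is the new ``self.positive`` branch: ``scipy.optimize.nnls`` only accepts a 1-D right-hand side, so multi-output targets are solved one column at a time in parallel and the per-column solutions are stacked. The same dispatch as a standalone function — the name ``nnls_multi_output`` is hypothetical, for illustration only:

    import numpy as np
    from joblib import Parallel, delayed
    from scipy import optimize

    def nnls_multi_output(X, Y, n_jobs=None):
        # min ||X w - Y||^2 subject to w >= 0, one NNLS problem per
        # column of Y, mirroring the branch added to LinearRegression.fit
        if Y.ndim < 2:
            return optimize.nnls(X, Y)  # (coef, residual) for a single target
        outs = Parallel(n_jobs=n_jobs)(
            delayed(optimize.nnls)(X, Y[:, j]) for j in range(Y.shape[1]))
        # stack per-column results: coef becomes (n_targets, n_features)
        coef, residues = map(np.vstack, zip(*outs))
        return coef, residues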

sklearn/linear_model/tests/test_base.py

Lines changed: 81 additions & 1 deletion
@@ -13,13 +13,13 @@
 from sklearn.utils._testing import assert_array_equal
 from sklearn.utils._testing import assert_almost_equal
 from sklearn.utils._testing import assert_allclose
+from sklearn.utils import check_random_state
 from sklearn.utils.fixes import parse_version

 from sklearn.linear_model import LinearRegression
 from sklearn.linear_model._base import _preprocess_data
 from sklearn.linear_model._base import _rescale_data
 from sklearn.linear_model._base import make_dataset
-from sklearn.utils import check_random_state
 from sklearn.datasets import make_sparse_uncorrelated
 from sklearn.datasets import make_regression
 from sklearn.datasets import load_iris

@@ -94,6 +94,18 @@ def test_linear_regression_sample_weights():
     assert_almost_equal(inter1, coefs2[0])


+def test_raises_value_error_if_positive_and_sparse():
+    error_msg = ('A sparse matrix was passed, '
+                 'but dense data is required.')
+    # X must not be sparse if positive == True
+    X = sparse.eye(10)
+    y = np.ones(10)
+
+    reg = LinearRegression(positive=True)
+
+    with pytest.raises(TypeError, match=error_msg):
+        reg.fit(X, y)
+
 def test_raises_value_error_if_sample_weights_greater_than_1d():
     # Sample weights must be either scalar or 1D

@@ -206,6 +218,74 @@ def test_linear_regression_sparse_multiple_outcome(random_state=0):
     assert_array_almost_equal(np.vstack((y_pred, y_pred)).T, Y_pred, decimal=3)


+def test_linear_regression_positive():
+    # Test nonnegative LinearRegression on a simple dataset.
+    X = [[1], [2]]
+    y = [1, 2]
+
+    reg = LinearRegression(positive=True)
+    reg.fit(X, y)
+
+    assert_array_almost_equal(reg.coef_, [1])
+    assert_array_almost_equal(reg.intercept_, [0])
+    assert_array_almost_equal(reg.predict(X), [1, 2])
+
+    # test it also for degenerate input
+    X = [[1]]
+    y = [0]
+
+    reg = LinearRegression(positive=True)
+    reg.fit(X, y)
+    assert_allclose(reg.coef_, [0])
+    assert_allclose(reg.intercept_, [0])
+    assert_allclose(reg.predict(X), [0])
+
+
+def test_linear_regression_positive_multiple_outcome(random_state=0):
+    # Test multiple-outcome nonnegative linear regressions
+    random_state = check_random_state(random_state)
+    X, y = make_sparse_uncorrelated(random_state=random_state)
+    Y = np.vstack((y, y)).T
+    n_features = X.shape[1]
+
+    ols = LinearRegression(positive=True)
+    ols.fit(X, Y)
+    assert ols.coef_.shape == (2, n_features)
+    assert np.all(ols.coef_ >= 0.)
+    Y_pred = ols.predict(X)
+    ols.fit(X, y.ravel())
+    y_pred = ols.predict(X)
+    assert_allclose(np.vstack((y_pred, y_pred)).T, Y_pred)
+
+
+def test_linear_regression_positive_vs_nonpositive():
+    # Test differences with LinearRegression when positive=False.
+    X, y = make_sparse_uncorrelated(random_state=0)
+
+    reg = LinearRegression(positive=True)
+    reg.fit(X, y)
+    regn = LinearRegression(positive=False)
+    regn.fit(X, y)
+
+    assert np.mean((reg.coef_ - regn.coef_)**2) > 1e-3
+
+
+def test_linear_regression_positive_vs_nonpositive_when_positive():
+    # Test LinearRegression fitted coefficients
+    # when the problem is positive.
+    n_samples = 200
+    n_features = 4
+    X = rng.rand(n_samples, n_features)
+    y = X[:, 0] + 2 * X[:, 1] + 3 * X[:, 2] + 1.5 * X[:, 3]
+
+    reg = LinearRegression(positive=True)
+    reg.fit(X, y)
+    regn = LinearRegression(positive=False)
+    regn.fit(X, y)
+
+    assert np.mean((reg.coef_ - regn.coef_)**2) < 1e-6
+
+
 def test_linear_regression_pd_sparse_dataframe_warning():
     pd = pytest.importorskip('pandas')
     # restrict the pd versions < '0.24.0' as they have a bug in is_sparse func
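
Note that ``rng`` in the last test refers to a module-level random state already defined near the top of test_base.py, which is why the hunk does not introduce it. The property these last two tests pin down — NNLS and OLS disagree in general but coincide when the unconstrained solution is already nonnegative — can be seen directly with SciPy; a hypothetical illustration, not part of the commit:

    import numpy as np
    from scipy import linalg, optimize

    rng = np.random.RandomState(0)
    X = rng.rand(200, 4)
    y = X @ np.array([1.0, 2.0, 3.0, 1.5])  # noiseless, all-positive truth

    coef_ols = linalg.lstsq(X, y)[0]    # unconstrained least squares
    coef_nnls = optimize.nnls(X, y)[0]  # nonnegativity-constrained

    # the constraint is inactive here, so the two solutions coincide
    assert np.allclose(coef_ols, coef_nnls)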
