DEP Deprecate n_classes_ in GradientBoostingRegressor (#17702) · jayzed82/scikit-learn@c6e0627

Commit c6e0627

simonamaggio authored and glemaitre committed
DEP Deprecate n_classes_ in GradientBoostingRegressor (scikit-learn#17702)
Co-authored-by: Guillaume Lemaitre <g.lemaitre58@gmail.com>
1 parent 374ac20 commit c6e0627

File tree: 5 files changed (+99, −57 lines)
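
In user-facing terms, this commit turns ``n_classes_`` on GradientBoostingRegressor into a deprecated property: reading it on a fitted estimator emits a FutureWarning and returns 1, while reading it on an unfitted estimator raises AttributeError. A minimal sketch of the new behavior (the toy data is illustrative, not taken from the commit):

    import warnings
    import numpy as np
    from sklearn.ensemble import GradientBoostingRegressor

    rng = np.random.RandomState(0)
    X, y = rng.rand(20, 3), rng.rand(20)
    gbr = GradientBoostingRegressor(n_estimators=5).fit(X, y)

    with warnings.catch_warnings(record=True) as caught:
        warnings.simplefilter("always")
        n = gbr.n_classes_        # deprecated access path
    print(n)                      # 1
    print(caught[0].category)     # <class 'FutureWarning'>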

doc/whats_new/v0.24.rst (+4)
@@ -147,6 +147,10 @@ Changelog
   which allows monitoring of each stage.
   :pr:`16985` by :user:`Hao Chun Chang <haochunchang>`.
 
+- |API|: The attribute ``n_classes_`` is now deprecated in
+  :class:`ensemble.GradientBoostingRegressor` and returns `1`.
+  :pr:`17702` by :user:`Simona Maggio <simonamaggio>`.
+
 :mod:`sklearn.exceptions`
 .........................
 
sklearn/ensemble/_gb.py (+46, −20)
@@ -29,6 +29,7 @@
 from ..base import RegressorMixin
 from ..base import BaseEstimator
 from ..base import is_classifier
+from ..utils import deprecated
 
 from ._gradient_boosting import predict_stages
 from ._gradient_boosting import predict_stage
@@ -165,9 +166,13 @@ def __init__(self, *, loss, learning_rate, n_estimators, criterion,
         self.n_iter_no_change = n_iter_no_change
         self.tol = tol
 
+    @abstractmethod
+    def _validate_y(self, y, sample_weight=None):
+        """Called by fit to validate y"""
+
     def _fit_stage(self, i, X, y, raw_predictions, sample_weight, sample_mask,
                    random_state, X_csc=None, X_csr=None):
-        """Fit another stage of ``n_classes_`` trees to the boosting model. """
+        """Fit another stage of ``_n_classes`` trees to the boosting model. """
 
         assert sample_mask.dtype == bool
         loss = self.loss_
@@ -240,10 +245,12 @@ def _check_params(self):
         else:
             loss_class = _gb_losses.LOSS_FUNCTIONS[self.loss]
 
-        if self.loss in ('huber', 'quantile'):
-            self.loss_ = loss_class(self.n_classes_, self.alpha)
-        else:
+        if is_classifier(self):
             self.loss_ = loss_class(self.n_classes_)
+        elif self.loss in ("huber", "quantile"):
+            self.loss_ = loss_class(self.alpha)
+        else:
+            self.loss_ = loss_class()
 
         if not (0.0 < self.subsample <= 1.0):
             raise ValueError("subsample must be in (0,1] but "
@@ -265,11 +272,9 @@ def _check_params(self):
 
         if isinstance(self.max_features, str):
             if self.max_features == "auto":
-                # if is_classification
-                if self.n_classes_ > 1:
+                if is_classifier(self):
                     max_features = max(1, int(np.sqrt(self.n_features_)))
                 else:
-                    # is regression
                     max_features = self.n_features_
             elif self.max_features == "sqrt":
                 max_features = max(1, int(np.sqrt(self.n_features_)))
@@ -405,7 +410,11 @@ def fit(self, X, y, sample_weight=None, monitor=None):
         sample_weight = _check_sample_weight(sample_weight, X)
 
         y = column_or_1d(y, warn=True)
-        y = self._validate_y(y, sample_weight)
+
+        if is_classifier(self):
+            y = self._validate_y(y, sample_weight)
+        else:
+            y = self._validate_y(y)
 
         if self.n_iter_no_change is not None:
             stratify = y if is_classifier(self) else None
@@ -415,7 +424,7 @@
                                  test_size=self.validation_fraction,
                                  stratify=stratify))
             if is_classifier(self):
-                if self.n_classes_ != np.unique(y).shape[0]:
+                if self._n_classes != np.unique(y).shape[0]:
                     # We choose to error here. The problem is that the init
                     # estimator would be trained on y, which has some missing
                     # classes now, so its predictions would not have the
@@ -711,15 +720,6 @@ def _compute_partial_dependence_recursion(self, grid, target_features):
 
         return averaged_predictions
 
-    def _validate_y(self, y, sample_weight):
-        # 'sample_weight' is not utilised but is used for
-        # consistency with similar method _validate_y of GBC
-        self.n_classes_ = 1
-        if y.dtype.kind == 'O':
-            y = y.astype(DOUBLE)
-        # Default implementation
-        return y
-
     def apply(self, X):
         """Apply trees in the ensemble to X, return leaf indices.
 
@@ -1096,7 +1096,9 @@ def _validate_y(self, y, sample_weight):
                              "trimmed classes with zero weights, while a "
                              "minimum of 2 classes are required."
                              % n_trim_classes)
-        self.n_classes_ = len(self.classes_)
+        self._n_classes = len(self.classes_)
+        # expose n_classes_ attribute
+        self.n_classes_ = self._n_classes
         return y
 
     def decision_function(self, X):
@@ -1507,7 +1509,11 @@ class GradientBoostingRegressor(RegressorMixin, BaseGradientBoosting):
         The collection of fitted sub-estimators.
 
     n_classes_ : int
-        The number of classes, set to 1 in regression tasks.
+        The number of classes, set to 1 for regressors.
+
+        .. deprecated:: 0.24
+            Attribute ``n_classes_`` was deprecated in version 0.24 and
+            will be removed in 0.26.
 
     n_estimators_ : int
         The number of estimators as selected by early stopping (if
@@ -1589,6 +1595,11 @@ def __init__(self, *, loss='ls', learning_rate=0.1, n_estimators=100,
             validation_fraction=validation_fraction,
             n_iter_no_change=n_iter_no_change, tol=tol, ccp_alpha=ccp_alpha)
 
+    def _validate_y(self, y, sample_weight=None):
+        if y.dtype.kind == 'O':
+            y = y.astype(DOUBLE)
+        return y
+
     def predict(self, X):
         """Predict regression target for X.
 
@@ -1651,3 +1662,18 @@ def apply(self, X):
         leaves = super().apply(X)
         leaves = leaves.reshape(X.shape[0], self.estimators_.shape[0])
         return leaves
+
+    # FIXME: to be removed in 0.26
+    # mypy error: Decorated property not supported
+    @deprecated("Attribute n_classes_ was deprecated "  # type: ignore
+                "in version 0.24 and will be removed in 0.26.")
+    @property
+    def n_classes_(self):
+        try:
+            check_is_fitted(self)
+        except NotFittedError as nfe:
+            raise AttributeError(
+                "{} object has no n_classes_ attribute."
+                .format(self.__class__.__name__)
+            ) from nfe
+        return 1
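
For reference, the ``@deprecated`` / ``@property`` stacking above can be exercised in isolation. A minimal sketch, assuming a hypothetical ``Toy`` class; only ``sklearn.utils.deprecated`` is taken from the commit:

    from sklearn.utils import deprecated

    class Toy:
        # hypothetical class; same decorator stacking as n_classes_ above
        @deprecated("Attribute n_classes_ was deprecated "
                    "in version 0.24 and will be removed in 0.26.")
        @property
        def n_classes_(self):
            return 1

    Toy().n_classes_  # emits a FutureWarning, then returns 1

Putting ``@deprecated`` outermost matters: it wraps the property object itself, so the warning fires on attribute access rather than at class definition time.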

sklearn/ensemble/_gb_losses.py (+7, −22)
@@ -145,18 +145,9 @@ def get_init_raw_predictions(self, X, estimator):
 
 
 class RegressionLossFunction(LossFunction, metaclass=ABCMeta):
-    """Base class for regression loss functions.
-
-    Parameters
-    ----------
-    n_classes : int
-        Number of classes.
-    """
-    def __init__(self, n_classes):
-        if n_classes != 1:
-            raise ValueError("``n_classes`` must be 1 for regression but "
-                             "was %r" % n_classes)
-        super().__init__(n_classes)
+    """Base class for regression loss functions."""
+    def __init__(self):
+        super().__init__(n_classes=1)
 
     def check_init_estimator(self, estimator):
         """Make sure estimator has the required fit and predict methods.
@@ -328,9 +319,6 @@ class HuberLossFunction(RegressionLossFunction):
 
     Parameters
     ----------
-    n_classes : int
-        Number of classes.
-
     alpha : float, default=0.9
         Percentile at which to extract score.
@@ -340,8 +328,8 @@ class HuberLossFunction(RegressionLossFunction):
     Machine, The Annals of Statistics, Vol. 29, No. 5, 2001.
     """
 
-    def __init__(self, n_classes, alpha=0.9):
-        super().__init__(n_classes)
+    def __init__(self, alpha=0.9):
+        super().__init__()
         self.alpha = alpha
         self.gamma = None
 
@@ -439,14 +427,11 @@ class QuantileLossFunction(RegressionLossFunction):
 
     Parameters
    ----------
-    n_classes : int
-        Number of classes.
-
     alpha : float, default=0.9
         The percentile.
     """
-    def __init__(self, n_classes, alpha=0.9):
-        super().__init__(n_classes)
+    def __init__(self, alpha=0.9):
+        super().__init__()
         self.alpha = alpha
         self.percentile = alpha * 100

sklearn/ensemble/tests/test_gradient_boosting.py (+27)
@@ -1306,3 +1306,30 @@ def test_gbr_degenerate_feature_importances():
     gbr = GradientBoostingRegressor().fit(X, y)
     assert_array_equal(gbr.feature_importances_,
                        np.zeros(10, dtype=np.float64))
+
+
+# TODO: Remove in 0.26 when `n_classes_` is deprecated
+def test_gbr_deprecated_attr():
+    # check that accessing n_classes_ in GradientBoostingRegressor raises
+    # a deprecation warning
+    X = np.zeros((10, 10))
+    y = np.ones((10,))
+    gbr = GradientBoostingRegressor().fit(X, y)
+    msg = "Attribute n_classes_ was deprecated"
+    with pytest.warns(FutureWarning, match=msg):
+        gbr.n_classes_
+
+
+# TODO: Remove in 0.26 when `n_classes_` is deprecated
+@pytest.mark.filterwarnings("ignore:Attribute n_classes_ was deprecated")
+def test_attr_error_raised_if_not_fitted():
+    # check that accessing n_classes_ in not fitted GradientBoostingRegressor
+    # raises an AttributeError
+    gbr = GradientBoostingRegressor()
+    # test raise AttributeError if not fitted
+    msg = (
+        f"{GradientBoostingRegressor.__name__} object has no n_classes_ "
+        f"attribute."
+    )
+    with pytest.raises(AttributeError, match=msg):
+        gbr.n_classes_
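
A design point the second test pins down: raising AttributeError from the property keeps ``hasattr`` honest, so an unfitted regressor still duck-types as not having the attribute. A hedged sketch of the expected behavior:

    import warnings
    from sklearn.ensemble import GradientBoostingRegressor

    with warnings.catch_warnings():
        # the deprecation warning still fires before the AttributeError
        warnings.simplefilter("ignore", FutureWarning)
        print(hasattr(GradientBoostingRegressor(), "n_classes_"))  # False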

sklearn/ensemble/tests/test_gradient_boosting_loss_functions.py (+15, −15)
@@ -62,7 +62,7 @@ def test_sample_weight_smoke():
     pred = rng.rand(100)
 
     # least squares
-    loss = LeastSquaresError(1)
+    loss = LeastSquaresError()
     loss_wo_sw = loss(y, pred)
     loss_w_sw = loss(y, pred, np.ones(pred.shape[0], dtype=np.float32))
     assert_almost_equal(loss_wo_sw, loss_w_sw)
@@ -81,16 +81,16 @@ def test_sample_weight_init_estimators():
         if Loss is None:
             continue
         if issubclass(Loss, RegressionLossFunction):
-            k = 1
             y = reg_y
+            loss = Loss()
         else:
             k = 2
             y = clf_y
             if Loss.is_multi_class:
                 # skip multiclass
                 continue
+            loss = Loss(k)
 
-        loss = Loss(k)
         init_est = loss.init_estimator()
         init_est.fit(X, y)
         out = loss.get_init_raw_predictions(X, init_est)
@@ -110,7 +110,7 @@ def test_quantile_loss_function():
     # There was a sign problem when evaluating the function
     # for negative values of 'ytrue - ypred'
     x = np.asarray([-1.0, 0.0, 1.0])
-    y_found = QuantileLossFunction(1, 0.9)(x, np.zeros_like(x))
+    y_found = QuantileLossFunction(0.9)(x, np.zeros_like(x))
     y_expected = np.asarray([0.1, 0.0, 0.9]).mean()
     np.testing.assert_allclose(y_found, y_expected)
 
@@ -127,9 +127,9 @@ def test_sample_weight_deviance():
         if Loss is None:
             continue
         if issubclass(Loss, RegressionLossFunction):
-            k = 1
             y = reg_y
             p = reg_y
+            loss = Loss()
         else:
             k = 2
             y = clf_y
@@ -141,8 +141,8 @@ def test_sample_weight_deviance():
                 p = np.zeros((y.shape[0], k), dtype=np.float64)
                 for i in range(k):
                     p[:, i] = y == i
+            loss = Loss(k)
 
-        loss = Loss(k)
         deviance_w_w = loss(y, p, sample_weight)
         deviance_wo_w = loss(y, p)
         assert deviance_wo_w == deviance_w_w
@@ -201,10 +201,10 @@ def test_init_raw_predictions_shapes():
     n_samples = 100
     X = rng.normal(size=(n_samples, 5))
     y = rng.normal(size=n_samples)
-    for loss in (LeastSquaresError(n_classes=1),
-                 LeastAbsoluteError(n_classes=1),
-                 QuantileLossFunction(n_classes=1),
-                 HuberLossFunction(n_classes=1)):
+    for loss in (LeastSquaresError(),
+                 LeastAbsoluteError(),
+                 QuantileLossFunction(),
+                 HuberLossFunction()):
         init_estimator = loss.init_estimator().fit(X, y)
         raw_predictions = loss.get_init_raw_predictions(y, init_estimator)
         assert raw_predictions.shape == (n_samples, 1)
@@ -237,23 +237,23 @@ def test_init_raw_predictions_values():
     y = rng.normal(size=n_samples)
 
     # Least squares loss
-    loss = LeastSquaresError(n_classes=1)
+    loss = LeastSquaresError()
     init_estimator = loss.init_estimator().fit(X, y)
     raw_predictions = loss.get_init_raw_predictions(y, init_estimator)
     # Make sure baseline prediction is the mean of all targets
     assert_almost_equal(raw_predictions, y.mean())
 
     # Least absolute and huber loss
     for Loss in (LeastAbsoluteError, HuberLossFunction):
-        loss = Loss(n_classes=1)
+        loss = Loss()
         init_estimator = loss.init_estimator().fit(X, y)
         raw_predictions = loss.get_init_raw_predictions(y, init_estimator)
         # Make sure baseline prediction is the median of all targets
         assert_almost_equal(raw_predictions, np.median(y))
 
     # Quantile loss
     for alpha in (.1, .5, .9):
-        loss = QuantileLossFunction(n_classes=1, alpha=alpha)
+        loss = QuantileLossFunction(alpha=alpha)
         init_estimator = loss.init_estimator().fit(X, y)
         raw_predictions = loss.get_init_raw_predictions(y, init_estimator)
         # Make sure baseline prediction is the alpha-quantile of all targets
@@ -294,8 +294,8 @@ def test_init_raw_predictions_values():
 @pytest.mark.parametrize('seed', range(5))
 def test_lad_equals_quantile_50(seed):
     # Make sure quantile loss with alpha = .5 is equivalent to LAD
-    lad = LeastAbsoluteError(n_classes=1)
-    ql = QuantileLossFunction(n_classes=1, alpha=0.5)
+    lad = LeastAbsoluteError()
+    ql = QuantileLossFunction(alpha=0.5)
 
     n_samples = 50
     rng = np.random.RandomState(seed)
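
Finally, a sanity check that the signature change leaves the internals alone: the base LossFunction should still record one tree per stage for regression losses. This assumes, as in the 0.24 sources, that the count is stored on the ``K`` attribute:

    from sklearn.ensemble._gb_losses import LeastSquaresError

    # RegressionLossFunction.__init__ now pins n_classes=1 (assumption: stored as K)
    assert LeastSquaresError().K == 1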
