Raise ValueError instead of RuntimeWarning for LinearModelLoss #27332


Open · akaashp2000 wants to merge 5 commits into main
21 changes: 10 additions & 11 deletions sklearn/ensemble/tests/test_stacking.py
@@ -26,7 +26,7 @@
     StackingClassifier,
     StackingRegressor,
 )
-from sklearn.exceptions import ConvergenceWarning, NotFittedError
+from sklearn.exceptions import NotFittedError
 from sklearn.linear_model import (
     LinearRegression,
     LogisticRegression,
@@ -42,7 +42,6 @@
 from sklearn.utils._testing import (
     assert_allclose,
     assert_allclose_dense_sparse,
-    ignore_warnings,
 )
 from sklearn.utils.fixes import COO_CONTAINERS, CSC_CONTAINERS, CSR_CONTAINERS

@@ -54,6 +53,8 @@
     n_classes=3, random_state=42
 )
 X_binary, y_binary = make_classification(n_classes=2, random_state=42)
+X_breast_cancer, y_breast_cancer = load_breast_cancer(return_X_y=True)
+X_breast_cancer = scale(X_breast_cancer)


 @pytest.mark.parametrize(
@@ -435,7 +436,8 @@ def test_stacking_classifier_stratify_default():
             final_estimator=LogisticRegression(),
             cv=KFold(shuffle=True, random_state=42),
         ),
-        *load_breast_cancer(return_X_y=True),
+        X_breast_cancer,
+        y_breast_cancer,
     ),
     (
         StackingRegressor(
@@ -464,18 +466,15 @@ def test_stacking_with_sample_weight(stacker, X, y):
         X, y, total_sample_weight, random_state=42
     )

-    with ignore_warnings(category=ConvergenceWarning):
-        stacker.fit(X_train, y_train)
+    stacker.fit(X_train, y_train)
     y_pred_no_weight = stacker.predict(X_test)

-    with ignore_warnings(category=ConvergenceWarning):
-        stacker.fit(X_train, y_train, sample_weight=np.ones(y_train.shape))
+    stacker.fit(X_train, y_train, sample_weight=np.ones(y_train.shape))
     y_pred_unit_weight = stacker.predict(X_test)

     assert_allclose(y_pred_no_weight, y_pred_unit_weight)

-    with ignore_warnings(category=ConvergenceWarning):
-        stacker.fit(X_train, y_train, sample_weight=sample_weight_train)
+    stacker.fit(X_train, y_train, sample_weight=sample_weight_train)
     y_pred_biased = stacker.predict(X_test)

     assert np.abs(y_pred_no_weight - y_pred_biased).sum() > 0
@@ -490,7 +489,6 @@ def test_stacking_classifier_sample_weight_fit_param():
     stacker.fit(X_iris, y_iris, sample_weight=np.ones(X_iris.shape[0]))


-@pytest.mark.filterwarnings("ignore::sklearn.exceptions.ConvergenceWarning")
 @pytest.mark.parametrize(
     "stacker, X, y",
     [
@@ -502,7 +500,8 @@ def test_stacking_classifier_sample_weight_fit_param():
             ],
             final_estimator=LogisticRegression(),
         ),
-        *load_breast_cancer(return_X_y=True),
+        X_breast_cancer,
+        y_breast_cancer,
     ),
     (
         StackingRegressor(
20 changes: 18 additions & 2 deletions sklearn/linear_model/_linear_loss.py
@@ -291,13 +291,29 @@

         if not self.base_loss.is_multiclass:
             grad = np.empty_like(coef, dtype=weights.dtype)
-            grad[:n_features] = X.T @ grad_pointwise + l2_reg_strength * weights
+            with np.errstate(all="raise"):
+                try:
+                    grad[:n_features] = X.T @ grad_pointwise + l2_reg_strength * weights
+                except FloatingPointError:

Member suggested change:
-                except FloatingPointError:
+                except FloatingPointError as exc:

akaashpatelmns replied (Nov 6, 2023):
When I use exc as you have in this suggestion, testing on the dataset from #27016 I get the following:

---------------------------------------------------------------------------
FloatingPointError                        Traceback (most recent call last)
File ~/Downloads/scikit-learn/sklearn/linear_model/_linear_loss.py:296, in LinearModelLoss.loss_gradient(self, coef, X, y, sample_weight, l2_reg_strength, n_threads, raw_prediction)
    295 try:
--> 296     grad[:n_features] = X.T @ grad_pointwise + l2_reg_strength * weights
    297     print("min entry", np.min(grad_pointwise))

FloatingPointError: invalid value encountered in matmul

The above exception was the direct cause of the following exception:

so it still includes the original exception that I am "wrapping" with a ValueError and message. Do you reckon it's better this way?
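
For context, a minimal standalone sketch (plain NumPy, not the scikit-learn class; names are illustrative) of what the two chaining styles do:

```python
import numpy as np

X = np.ones((2, 1))
g = np.array([np.inf, -np.inf])  # a gradient that already blew up

with np.errstate(all="raise"):
    try:
        X.T @ g  # inf + (-inf) -> NaN raises FloatingPointError here
    except FloatingPointError as exc:
        # "from exc" keeps the FloatingPointError in the traceback as
        # "The above exception was the direct cause of ..."; "from None"
        # would suppress the chained traceback entirely.
        raise ValueError(
            "Overflow detected. Try scaling the target variable or"
            " features, or using a different solver"
        ) from exc
```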

+                    raise ValueError(
+                        "Overflow detected. Try scaling the target variable or"
+                        " features, or using a different solver"
+                    ) from None

[Codecov / codecov/patch] Added lines #L297-L298 were not covered by tests.

Member suggested change:
-                    ) from None
+                    ) from exc

             if self.fit_intercept:
                 grad[-1] = grad_pointwise.sum()
         else:
             grad = np.empty((n_classes, n_dof), dtype=weights.dtype, order="F")
             # grad_pointwise.shape = (n_samples, n_classes)
-            grad[:, :n_features] = grad_pointwise.T @ X + l2_reg_strength * weights
+            with np.errstate(all="raise"):

Member commented:
If this is an overflow, I think that using over="raise" would be better.

akaashpatelmns replied:
I tried using over="raise", but this didn't raise an exception and the RuntimeWarning appeared instead when I tested with the dataset I encountered this issue with in the first place (#27016). During one of the iterations there was an infinity in one of the gradients, which is where I wanted to raise the exception.
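
A small plain-NumPy sketch (illustrative, not part of the PR) of why over="raise" can miss this case: once an infinity is already present, the matmul produces inf + (-inf) = NaN, which trips the *invalid* flag rather than the *overflow* flag:

```python
import numpy as np

X = np.ones((3, 2))
grad_pointwise = np.array([np.inf, -np.inf, 0.0])  # inf from an earlier iteration

with np.errstate(over="raise"):
    # inf + (-inf) inside the product is an *invalid* operation, not an
    # overflow, so this only emits "RuntimeWarning: invalid value
    # encountered in matmul" and returns [nan nan].
    print(X.T @ grad_pointwise)

with np.errstate(all="raise"):
    # Now the same operation raises:
    # FloatingPointError: invalid value encountered in matmul
    X.T @ grad_pointwise
```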

+                try:
+                    grad[:, :n_features] = (
+                        grad_pointwise.T @ X + l2_reg_strength * weights
+                    )
+                except FloatingPointError:

Member suggested change:
-                except FloatingPointError:
+                except FloatingPointError as exc:

+                    raise ValueError(
+                        "Overflow detected. Try scaling the target variable or"
+                        " features, or using a different solver"
+                    ) from None

[Codecov / codecov/patch] Added lines #L312-L313 were not covered by tests.

Member suggested change:
-                    ) from None
+                    ) from exc

             if self.fit_intercept:
                 grad[:, -1] = grad_pointwise.sum(axis=0)
         if coef.ndim == 1:
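
For reference, the pattern this PR adds, extracted into a hypothetical standalone helper (the real code lives inside LinearModelLoss.loss_gradient; safe_grad is an illustrative name only):

```python
import numpy as np

def safe_grad(X, grad_pointwise, weights, l2_reg_strength):
    """Guarded gradient update: turn floating-point errors into ValueError."""
    with np.errstate(all="raise"):
        try:
            return X.T @ grad_pointwise + l2_reg_strength * weights
        except FloatingPointError:
            raise ValueError(
                "Overflow detected. Try scaling the target variable or"
                " features, or using a different solver"
            ) from None

# A gradient that already contains an infinity now surfaces as a ValueError
# instead of a RuntimeWarning plus silent NaNs:
try:
    safe_grad(np.ones((2, 1)), np.array([np.inf, -np.inf]), np.zeros(1), 1.0)
except ValueError as e:
    print(e)
```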