MNT `ruff format` · scikit-learn/scikit-learn@b87f48e · GitHub

Commit b87f48e

MNT ruff format
1 parent b5415eb commit b87f48e

59 files changed: 228 additions, 235 deletions


benchmarks/bench_hist_gradient_boosting_adult.py (1 addition, 1 deletion)

@@ -46,7 +46,7 @@ def predict(est, data_test, target_test):
     toc = time()
     roc_auc = roc_auc_score(target_test, predicted_proba_test[:, 1])
     acc = accuracy_score(target_test, predicted_test)
-    print(f"predicted in {toc - tic:.3f}s, ROC AUC: {roc_auc:.4f}, ACC: {acc :.4f}")
+    print(f"predicted in {toc - tic:.3f}s, ROC AUC: {roc_auc:.4f}, ACC: {acc:.4f}")


 data = fetch_openml(data_id=179, as_frame=True)  # adult dataset
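This first hunk is typical of the whole commit: `ruff format` normalizing the inside of an f-string replacement field. `{acc :.4f}` is legal Python (the stray space belongs to the expression), so the rewrite is purely cosmetic. A minimal sketch of the two spellings, runnable on any recent Python; note that ruff only reformats f-string interiors in newer versions, so treat that version requirement as an assumption:

acc = 0.98765
print(f"ACC: {acc :.4f}")  # before: stray space ahead of the format spec
print(f"ACC: {acc:.4f}")   # after: the normalized form; both print "ACC: 0.9877"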

benchmarks/bench_hist_gradient_boosting_higgsboson.py (1 addition, 1 deletion)

@@ -74,7 +74,7 @@ def predict(est, data_test, target_test):
     toc = time()
     roc_auc = roc_auc_score(target_test, predicted_proba_test[:, 1])
     acc = accuracy_score(target_test, predicted_test)
-    print(f"predicted in {toc - tic:.3f}s, ROC AUC: {roc_auc:.4f}, ACC: {acc :.4f}")
+    print(f"predicted in {toc - tic:.3f}s, ROC AUC: {roc_auc:.4f}, ACC: {acc:.4f}")


 df = load_data()

examples/applications/plot_species_distribution_modeling.py (1 addition, 1 deletion)

@@ -109,7 +109,7 @@ def create_species_bunch(species_name, train, test, coverages, xgrid, ygrid):


 def plot_species_distribution(
-    species=("bradypus_variegatus_0", "microryzomys_minutus_0")
+    species=("bradypus_variegatus_0", "microryzomys_minutus_0"),
 ):
     """
     Plot the species distribution.
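Here the parameter list already spans multiple lines, so the formatter appends the "magic trailing comma" after the last argument, the same convention black uses. A hypothetical signature showing the identical rewrite (the name and body are illustrative only):

def plot_distribution(
    species=("bradypus_variegatus_0", "microryzomys_minutus_0"),  # comma added once the list is exploded
):
    ...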

examples/applications/plot_time_series_lagged_features.py (1 addition, 1 deletion)

@@ -265,7 +265,7 @@ def consolidate_scores(cv_results, scores, metric):
     time = cv_results["fit_time"]
     scores["fit_time"].append(f"{time.mean():.2f} ± {time.std():.2f} s")

-    scores["loss"].append(f"quantile {int(quantile*100)}")
+    scores["loss"].append(f"quantile {int(quantile * 100)}")
     for key, value in cv_results.items():
         if key.startswith("test_"):
             metric = key.split("test_")[1]
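Besides the spacing before format specs, the formatter also puts spaces around binary operators inside f-string expressions (`quantile*100` becomes `quantile * 100`). A small sketch, again assuming a ruff version that formats f-string interiors:

quantile = 0.05
print(f"quantile {int(quantile*100)}")    # before
print(f"quantile {int(quantile * 100)}")  # after: both print "quantile 5"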

examples/applications/plot_topics_extraction_with_nmf_lda.py (1 addition, 1 deletion)

@@ -50,7 +50,7 @@ def plot_top_words(model, feature_names, n_top_words, title):

         ax = axes[topic_idx]
         ax.barh(top_features, weights, height=0.7)
-        ax.set_title(f"Topic {topic_idx +1}", fontdict={"fontsize": 30})
+        ax.set_title(f"Topic {topic_idx + 1}", fontdict={"fontsize": 30})
         ax.tick_params(axis="both", which="major", labelsize=20)
         for i in "top right left".split():
             ax.spines[i].set_visible(False)

examples/ensemble/plot_bias_variance.py (2 additions, 2 deletions)

@@ -177,8 +177,8 @@ def generate(n_samples, noise, n_repeat=1):

     plt.subplot(2, n_estimators, n_estimators + n + 1)
     plt.plot(X_test, y_error, "r", label="$error(x)$")
-    plt.plot(X_test, y_bias, "b", label="$bias^2(x)$"),
-    plt.plot(X_test, y_var, "g", label="$variance(x)$"),
+    (plt.plot(X_test, y_bias, "b", label="$bias^2(x)$"),)
+    (plt.plot(X_test, y_var, "g", label="$variance(x)$"),)
     plt.plot(X_test, y_noise, "c", label="$noise(x)$")

     plt.xlim([-5, 5])
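The two changed lines above ended with stray commas, so each statement was really a one-element tuple expression. The formatter is designed not to change runtime behavior, so it keeps the tuple and merely makes it explicit with parentheses; removing the leftover commas, which look like a pre-existing typo, is left to a human. A minimal demonstration of why the comma matters:

value = 1,            # trailing comma: this is the tuple (1,), not the int 1
assert value == (1,)  # the explicit, parenthesized spelling ruff format produces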

examples/linear_model/plot_tweedie_regression_insurance_claims.py (3 additions, 2 deletions)

@@ -606,8 +606,9 @@ def score_estimator(
             "predicted, frequency*severity model": np.sum(
                 exposure * glm_freq.predict(X) * glm_sev.predict(X)
             ),
-            "predicted, tweedie, power=%.2f"
-            % glm_pure_premium.power: np.sum(exposure * glm_pure_premium.predict(X)),
+            "predicted, tweedie, power=%.2f" % glm_pure_premium.power: np.sum(
+                exposure * glm_pure_premium.predict(X)
+            ),
         }
     )

examples/manifold/plot_lle_digits.py (0 additions, 1 deletion)

@@ -10,7 +10,6 @@
 # Authors: The scikit-learn developers
 # SPDX-License-Identifier: BSD-3-Clause

-
 # %%
 # Load digits dataset
 # -------------------

examples/manifold/plot_manifold_sphere.py (1 addition, 1 deletion)

@@ -50,7 +50,7 @@
 t = random_state.rand(n_samples) * np.pi

 # Sever the poles from the sphere.
-indices = (t < (np.pi - (np.pi / 8))) & (t > ((np.pi / 8)))
+indices = (t < (np.pi - (np.pi / 8))) & (t > (np.pi / 8))
 colors = p[indices]
 x, y, z = (
     np.sin(t[indices]) * np.cos(p[indices]),

examples/model_selection/plot_likelihood_ratios.py (1 addition, 1 deletion)

@@ -40,7 +40,7 @@ class proportion than the target application.
 from sklearn.datasets import make_classification

 X, y = make_classification(n_samples=10_000, weights=[0.9, 0.1], random_state=0)
-print(f"Percentage of people carrying the disease: {100*y.mean():.2f}%")
+print(f"Percentage of people carrying the disease: {100 * y.mean():.2f}%")

 # %%
 # A machine learning model is built to diagnose if a person with some given

examples/model_selection/plot_roc.py (3 additions, 3 deletions)

@@ -152,9 +152,9 @@
 #
 # We can briefly demo the effect of :func:`numpy.ravel`:

-print(f"y_score:\n{y_score[0:2,:]}")
+print(f"y_score:\n{y_score[0:2, :]}")
 print()
-print(f"y_score.ravel():\n{y_score[0:2,:].ravel()}")
+print(f"y_score.ravel():\n{y_score[0:2, :].ravel()}")

 # %%
 # In a multi-class classification setup with highly imbalanced classes,

@@ -359,7 +359,7 @@
 plt.plot(
     fpr_grid,
     mean_tpr[ix],
-    label=f"Mean {label_a} vs {label_b} (AUC = {mean_score :.2f})",
+    label=f"Mean {label_a} vs {label_b} (AUC = {mean_score:.2f})",
     linestyle=":",
     linewidth=4,
 )
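The subscript changes in the first hunk are plain PEP 8 comma spacing; the slices themselves are identical. A quick check:

import numpy as np

y_score = np.arange(6).reshape(3, 2)
assert (y_score[0:2,:] == y_score[0:2, :]).all()  # same selection, only spacing differs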

sklearn/_loss/tests/test_loss.py (10 additions, 7 deletions)

@@ -215,7 +215,8 @@ def test_loss_boundary_y_true(loss, y_true_success, y_true_fail):


 @pytest.mark.parametrize(
-    "loss, y_pred_success, y_pred_fail", Y_COMMON_PARAMS + Y_PRED_PARAMS  # type: ignore
+    "loss, y_pred_success, y_pred_fail",
+    Y_COMMON_PARAMS + Y_PRED_PARAMS,  # type: ignore
 )
 def test_loss_boundary_y_pred(loss, y_pred_success, y_pred_fail):
     """Test boundaries of y_pred for loss functions."""

@@ -501,12 +502,14 @@ def test_loss_same_as_C_functions(loss, sample_weight):
         sample_weight=sample_weight,
         loss_out=out_l1,
     )
-    loss.closs.loss(
-        y_true=y_true,
-        raw_prediction=raw_prediction,
-        sample_weight=sample_weight,
-        loss_out=out_l2,
-    ),
+    (
+        loss.closs.loss(
+            y_true=y_true,
+            raw_prediction=raw_prediction,
+            sample_weight=sample_weight,
+            loss_out=out_l2,
+        ),
+    )
     assert_allclose(out_l1, out_l2)
     loss.gradient(
         y_true=y_true,

sklearn/cluster/_feature_agglomeration.py (0 additions, 1 deletion)

@@ -6,7 +6,6 @@
 # Authors: The scikit-learn developers
 # SPDX-License-Identifier: BSD-3-Clause

-
 import numpy as np
 from scipy.sparse import issparse

sklearn/cross_decomposition/tests/test_pls.py (2 additions, 2 deletions)

@@ -404,12 +404,12 @@ def test_copy(Est):

     X_orig = X.copy()
     with pytest.raises(AssertionError):
-        pls.transform(X, Y, copy=False),
+        (pls.transform(X, Y, copy=False),)
     assert_array_almost_equal(X, X_orig)

     X_orig = X.copy()
     with pytest.raises(AssertionError):
-        pls.predict(X, copy=False),
+        (pls.predict(X, copy=False),)
     assert_array_almost_equal(X, X_orig)

     # Make sure copy=True gives same transform and predictions as predict=False

sklearn/datasets/tests/test_openml.py (6 additions, 6 deletions)

@@ -105,9 +105,9 @@ def _file_name(url, suffix):
         )

     def _mock_urlopen_shared(url, has_gzip_header, expected_prefix, suffix):
-        assert url.startswith(
-            expected_prefix
-        ), f"{expected_prefix!r} does not match {url!r}"
+        assert url.startswith(expected_prefix), (
+            f"{expected_prefix!r} does not match {url!r}"
+        )

         data_file_name = _file_name(url, suffix)
         data_file_path = resources.files(data_module) / data_file_name

@@ -156,9 +156,9 @@ def _mock_urlopen_download_data(url, has_gzip_header):
         )

     def _mock_urlopen_data_list(url, has_gzip_header):
-        assert url.startswith(
-            url_prefix_data_list
-        ), f"{url_prefix_data_list!r} does not match {url!r}"
+        assert url.startswith(url_prefix_data_list), (
+            f"{url_prefix_data_list!r} does not match {url!r}"
+        )

         data_file_name = _file_name(url, ".json")
         data_file_path = resources.files(data_module) / data_file_name
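This is the pattern that accounts for most of the diff: the newer ruff style keeps the asserted condition on one line and parenthesizes the failure message, where the older style split the condition instead. A standalone sketch of both layouts, with illustrative values:

url = "https://api.openml.org/api/v1/json/data/42"
expected_prefix = "https://api.openml.org/"
# Old layout: the condition is exploded, the message trails the closing paren.
assert url.startswith(
    expected_prefix
), f"{expected_prefix!r} does not match {url!r}"
# New layout: the condition stays intact and the message is parenthesized.
assert url.startswith(expected_prefix), (
    f"{expected_prefix!r} does not match {url!r}"
)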

sklearn/datasets/tests/test_samples_generator.py (18 additions, 18 deletions)

@@ -138,17 +138,17 @@ def test_make_classification_informative_features():
         signs = signs.view(dtype="|S{0}".format(signs.strides[0])).ravel()
         unique_signs, cluster_index = np.unique(signs, return_inverse=True)

-        assert (
-            len(unique_signs) == n_clusters
-        ), "Wrong number of clusters, or not in distinct quadrants"
+        assert len(unique_signs) == n_clusters, (
+            "Wrong number of clusters, or not in distinct quadrants"
+        )

         clusters_by_class = defaultdict(set)
         for cluster, cls in zip(cluster_index, y):
             clusters_by_class[cls].add(cluster)
         for clusters in clusters_by_class.values():
-            assert (
-                len(clusters) == n_clusters_per_class
-            ), "Wrong number of clusters per class"
+            assert len(clusters) == n_clusters_per_class, (
+                "Wrong number of clusters per class"
+            )
         assert len(clusters_by_class) == n_classes, "Wrong number of classes"

         assert_array_almost_equal(

@@ -412,9 +412,9 @@ def test_make_blobs_n_samples_list():
     X, y = make_blobs(n_samples=n_samples, n_features=2, random_state=0)

     assert X.shape == (sum(n_samples), 2), "X shape mismatch"
-    assert all(
-        np.bincount(y, minlength=len(n_samples)) == n_samples
-    ), "Incorrect number of samples per blob"
+    assert all(np.bincount(y, minlength=len(n_samples)) == n_samples), (
+        "Incorrect number of samples per blob"
+    )


 def test_make_blobs_n_samples_list_with_centers():

@@ -426,9 +426,9 @@ def test_make_blobs_n_samples_list_with_centers():
     )

     assert X.shape == (sum(n_samples), 2), "X shape mismatch"
-    assert all(
-        np.bincount(y, minlength=len(n_samples)) == n_samples
-    ), "Incorrect number of samples per blob"
+    assert all(np.bincount(y, minlength=len(n_samples)) == n_samples), (
+        "Incorrect number of samples per blob"
+    )
     for i, (ctr, std) in enumerate(zip(centers, cluster_stds)):
         assert_almost_equal((X[y == i] - ctr).std(), std, 1, "Unexpected std")

@@ -441,9 +441,9 @@ def test_make_blobs_n_samples_centers_none(n_samples):
     X, y = make_blobs(n_samples=n_samples, centers=centers, random_state=0)

     assert X.shape == (sum(n_samples), 2), "X shape mismatch"
-    assert all(
-        np.bincount(y, minlength=len(n_samples)) == n_samples
-    ), "Incorrect number of samples per blob"
+    assert all(np.bincount(y, minlength=len(n_samples)) == n_samples), (
+        "Incorrect number of samples per blob"
+    )


 def test_make_blobs_return_centers():

@@ -681,9 +681,9 @@ def test_make_moons():

 def test_make_moons_unbalanced():
     X, y = make_moons(n_samples=(7, 5))
-    assert (
-        np.sum(y == 0) == 7 and np.sum(y == 1) == 5
-    ), "Number of samples in a moon is wrong"
+    assert np.sum(y == 0) == 7 and np.sum(y == 1) == 5, (
+        "Number of samples in a moon is wrong"
+    )
     assert X.shape == (12, 2), "X shape mismatch"
     assert y.shape == (12,), "y shape mismatch"

sklearn/ensemble/_bagging.py (0 additions, 1 deletion)

@@ -3,7 +3,6 @@
 # Authors: The scikit-learn developers
 # SPDX-License-Identifier: BSD-3-Clause

-
 import itertools
 import numbers
 from abc import ABCMeta, abstractmethod

sklearn/ensemble/_forest.py (0 additions, 1 deletion)

@@ -35,7 +35,6 @@ class calls the ``fit`` method of each sub-estimator on random samples
 # Authors: The scikit-learn developers
 # SPDX-License-Identifier: BSD-3-Clause

-
 import threading
 from abc import ABCMeta, abstractmethod
 from numbers import Integral, Real

sklearn/ensemble/tests/test_forest.py (10 additions, 9 deletions)

@@ -168,11 +168,12 @@ def test_regression_criterion(name, criterion):
     reg = ForestRegressor(n_estimators=5, criterion=criterion, random_state=1)
     reg.fit(X_reg, y_reg)
     score = reg.score(X_reg, y_reg)
-    assert (
-        score > 0.93
-    ), "Failed with max_features=None, criterion %s and score = %f" % (
-        criterion,
-        score,
+    assert score > 0.93, (
+        "Failed with max_features=None, criterion %s and score = %f"
+        % (
+            criterion,
+            score,
+        )
     )

     reg = ForestRegressor(

@@ -1068,10 +1069,10 @@ def test_min_weight_fraction_leaf(name):
         node_weights = np.bincount(out, weights=weights)
         # drop inner nodes
         leaf_weights = node_weights[node_weights != 0]
-        assert (
-            np.min(leaf_weights) >= total_weight * est.min_weight_fraction_leaf
-        ), "Failed with {0} min_weight_fraction_leaf={1}".format(
-            name, est.min_weight_fraction_leaf
+        assert np.min(leaf_weights) >= total_weight * est.min_weight_fraction_leaf, (
+            "Failed with {0} min_weight_fraction_leaf={1}".format(
+                name, est.min_weight_fraction_leaf
+            )
         )

sklearn/experimental/enable_hist_gradient_boosting.py (0 additions, 1 deletion)

@@ -13,7 +13,6 @@
 # Don't remove this file, we don't want to break users code just because the
 # feature isn't experimental anymore.

-
 import warnings

 warnings.warn(

sklearn/feature_selection/_univariate_selection.py (0 additions, 1 deletion)

@@ -3,7 +3,6 @@
 # Authors: The scikit-learn developers
 # SPDX-License-Identifier: BSD-3-Clause

-
 import warnings
 from numbers import Integral, Real

sklearn/gaussian_process/tests/test_gpc.py (3 additions, 2 deletions)

@@ -147,8 +147,9 @@ def test_custom_optimizer(kernel, global_random_seed):
     # Define a dummy optimizer that simply tests 10 random hyperparameters
     def optimizer(obj_func, initial_theta, bounds):
        rng = np.random.RandomState(global_random_seed)
-        theta_opt, func_min = initial_theta, obj_func(
-            initial_theta, eval_gradient=False
+        theta_opt, func_min = (
+            initial_theta,
+            obj_func(initial_theta, eval_gradient=False),
         )
         for _ in range(10):
             theta = np.atleast_1d(
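Instead of letting the second element of the right-hand tuple spill its call arguments across lines, the new style parenthesizes the whole tuple and gives each element its own line. A toy version of the same assignment, with a plain function standing in for the GP objective:

def obj_func(theta, eval_gradient=False):
    return sum(theta)  # hypothetical stand-in for the real objective

initial_theta = [0.1, 0.2]
theta_opt, func_min = (
    initial_theta,
    obj_func(initial_theta, eval_gradient=False),
)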

sklearn/gaussian_process/tests/test_gpr.py (3 additions, 2 deletions)

@@ -394,8 +394,9 @@ def test_custom_optimizer(kernel):
     # Define a dummy optimizer that simply tests 50 random hyperparameters
     def optimizer(obj_func, initial_theta, bounds):
         rng = np.random.RandomState(0)
-        theta_opt, func_min = initial_theta, obj_func(
-            initial_theta, eval_gradient=False
+        theta_opt, func_min = (
+            initial_theta,
+            obj_func(initial_theta, eval_gradient=False),
         )
         for _ in range(50):
             theta = np.atleast_1d(

sklearn/inspection/_plot/tests/test_plot_partial_dependence.py (4 additions, 4 deletions)

@@ -1187,7 +1187,7 @@ def test_plot_partial_dependence_lines_kw(

     line = disp.lines_[0, 0, -1]
     assert line.get_color() == expected_colors[0], (
-        f"{line.get_color()}!={expected_colors[0]}\n" f"{line_kw} and {pd_line_kw}"
+        f"{line.get_color()}!={expected_colors[0]}\n{line_kw} and {pd_line_kw}"
     )
     if pd_line_kw is not None:
         if "linestyle" in pd_line_kw:

@@ -1198,9 +1198,9 @@
         assert line.get_linestyle() == "--"

     line = disp.lines_[0, 0, 0]
-    assert (
-        line.get_color() == expected_colors[1]
-    ), f"{line.get_color()}!={expected_colors[1]}"
+    assert line.get_color() == expected_colors[1], (
+        f"{line.get_color()}!={expected_colors[1]}"
+    )
     if ice_lines_kw is not None:
         if "linestyle" in ice_lines_kw:
             assert line.get_linestyle() == ice_lines_kw["linestyle"]
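The first hunk in this file shows one more formatter behavior: two implicitly concatenated f-string parts that fit on one line are joined into a single literal. Whether this fires depends on the ruff version, so treat that as an assumption. A standalone sketch:

color, expected = "red", "blue"
split = f"{color}!={expected}\n" f"some context"  # implicit concatenation
joined = f"{color}!={expected}\nsome context"     # the joined literal ruff produces
assert split == joined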

sklearn/linear_model/_glm/_newton_solver.py (2 additions, 2 deletions)

@@ -254,7 +254,7 @@ def line_search(self, X, y, sample_weight):
             check = loss_improvement <= t * armijo_term
             if is_verbose:
                 print(
-                    f"  line search iteration={i+1}, step size={t}\n"
+                    f"  line search iteration={i + 1}, step size={t}\n"
                     f"  check loss improvement <= armijo term: {loss_improvement} "
                     f"<= {t * armijo_term} {check}"
                 )

@@ -300,7 +300,7 @@
         self.raw_prediction = raw
         if is_verbose:
             print(
-                f"  line search successful after {i+1} iterations with "
+                f"  line search successful after {i + 1} iterations with "
                 f"loss={self.loss_value}."
             )

0 commit comments