DOC speed up example plot_digits_pipe.py (scikit-learn#21728)

ArthDh · samronsin · commit 0bb859f11e8b · 2021-11-30T17:28:12.000+01:00
* Updated plot_digits_pipe

* Updated plot_digits_pipe with StandardScaler preprocessing
diff --git a/examples/compose/plot_digits_pipe.py b/examples/compose/plot_digits_pipe.py
@@ -24,20 +24,22 @@
 from sklearn.linear_model import LogisticRegression
 from sklearn.pipeline import Pipeline
 from sklearn.model_selection import GridSearchCV
-
+from sklearn.preprocessing import StandardScaler
 
 # Define a pipeline to search for the best combination of PCA truncation
 # and classifier regularization.
 pca = PCA()
+# Define a StandardScaler to standardize inputs (zero mean, unit variance)
+scaler = StandardScaler()
+
 # set the tolerance to a large value to make the example faster
 logistic = LogisticRegression(max_iter=10000, tol=0.1)
-pipe = Pipeline(steps=[("pca", pca), ("logistic", logistic)])
+pipe = Pipeline(steps=[("scaler", scaler), ("pca", pca), ("logistic", logistic)])
 
 X_digits, y_digits = datasets.load_digits(return_X_y=True)
-
 # Parameters of pipelines can be set using ‘__’ separated parameter names:
 param_grid = {
-    "pca__n_components": [5, 15, 30, 45, 64],
+    "pca__n_components": [5, 15, 30, 45, 60],
     "logistic__C": np.logspace(-4, 4, 4),
 }
 search = GridSearchCV(pipe, param_grid, n_jobs=2)