scikit-learn
diff --git a/‎doc/developers/index.rst
Lines changed: 8 additions & 4 deletions b/‎doc/developers/index.rst
Lines changed: 8 additions & 4 deletions
diff --git a/‎doc/whats_new.rst
Lines changed: 3 additions & 0 deletions b/‎doc/whats_new.rst
Lines changed: 3 additions & 0 deletions
diff --git a/‎sklearn/cluster/affinity_propagation_.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/cluster/affinity_propagation_.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎sklearn/cluster/dbscan_.py
Lines changed: 2 additions & 2 deletions b/‎sklearn/cluster/dbscan_.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎sklearn/cluster/hierarchical.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/cluster/hierarchical.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎sklearn/cluster/k_means_.py
Lines changed: 2 additions & 2 deletions b/‎sklearn/cluster/k_means_.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎sklearn/cluster/mean_shift_.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/cluster/mean_shift_.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎sklearn/cluster/spectral.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/cluster/spectral.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎sklearn/decomposition/dict_learning.py
Lines changed: 4 additions & 7 deletions b/‎sklearn/decomposition/dict_learning.py
Lines changed: 4 additions & 7 deletions
diff --git a/‎sklearn/decomposition/incremental_pca.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/decomposition/incremental_pca.py
Lines changed: 1 addition & 1 deletion
@@ -716,8 +716,11 @@ is not met, an exception of type ``ValueError`` should be raised.
 ``y`` might be ignored in the case of unsupervised learning. However, to
 make it possible to use the estimator as part of a pipeline that can
 mix both supervised and unsupervised transformers, even unsupervised
-estimators are kindly asked to accept a ``y=None`` keyword argument in
+estimators need to accept a ``y=None`` keyword argument in
 the second position that is just ignored by the estimator.
+For the same reason, ``fit_predict``, ``fit_transform``, ``score``,
+``transform`` and ``partial_fit`` methods need to accept a ``y`` argument in
+the second position if they are implemented.
 
 The method should return the object (``self``). This pattern is useful
 to be able to implement quick one liners in an IPython session such as::
@@ -857,9 +860,10 @@ last step, it needs to provide a ``fit`` or ``fit_transform`` function.
 To be able to evaluate the pipeline on any data but the training set,
 it also needs to provide a ``transform`` function.
 There are no special requirements for the last step in a pipeline, except that
-it has a ``fit`` function.  All ``fit`` and ``fit_transform`` functions must
-take arguments ``X, y``, even if y is not used.
-
+it has a ``fit`` function. All ``fit`` and ``fit_transform`` functions must
+take arguments ``X, y``, even if ``y`` is not used. Similarly, for ``score``
+to be usable, the last step of the pipeline needs to have a ``score``
+function that accepts an optional ``y``.
 
 Working notes
 -------------
 
@@ -176,6 +176,9 @@ Enhancements
    - Parallelized calculation of :func:`pairwise_distances` is now supported
      for scipy metrics and custom callables. By `Joel Nothman`_.
 
+   - Allow the fitting and scoring of all clustering algorithms in
+     :class:`pipeline.Pipeline`. By `Andreas Müller`_.
+
 Documentation improvements
 ..........................
 
 
@@ -269,7 +269,7 @@ def __init__(self, damping=.5, max_iter=200, convergence_iter=15,
     def _pairwise(self):
         return self.affinity == "precomputed"
 
-    def fit(self, X):
+    def fit(self, X, y=None):
         """ Create affinity matrix from negative euclidean distances, then
         apply affinity propagation clustering.
 
 
@@ -189,7 +189,7 @@ class DBSCAN(BaseEstimator, ClusterMixin):
         of the construction and query, as well as the memory required
         to store the tree. The optimal value depends
         on the nature of the problem.
- 
+
     Attributes
     ----------
     core_sample_indices_ : array, shape = [n_core_samples]
@@ -224,7 +224,7 @@ def __init__(self, eps=0.5, min_samples=5, metric='euclidean',
         self.p = p
         self.random_state = random_state
 
-    def fit(self, X, sample_weight=None):
+    def fit(self, X, y=None, sample_weight=None):
         """Perform DBSCAN clustering from features or distance matrix.
 
         Parameters
 
@@ -683,7 +683,7 @@ def __init__(self, n_clusters=2, affinity="euclidean",
         self.affinity = affinity
         self.pooling_func = pooling_func
 
-    def fit(self, X):
+    def fit(self, X, y=None):
         """Fit the hierarchical clustering on the data
 
         Parameters
 
@@ -795,7 +795,7 @@ def fit(self, X, y=None):
                 n_jobs=self.n_jobs)
         return self
 
-    def fit_predict(self, X):
+    def fit_predict(self, X, y=None):
         """Compute cluster centers and predict cluster index for each sample.
 
         Convenience method; equivalent to calling fit(X) followed by
@@ -864,7 +864,7 @@ def predict(self, X):
         x_squared_norms = row_norms(X, squared=True)
         return _labels_inertia(X, x_squared_norms, self.cluster_centers_)[0]
 
-    def score(self, X):
+    def score(self, X, y=None):
         """Opposite of the value of X on the K-means objective.
 
         Parameters
 
@@ -320,7 +320,7 @@ def __init__(self, bandwidth=None, seeds=None, bin_seeding=False,
         self.cluster_all = cluster_all
         self.min_bin_freq = min_bin_freq
 
-    def fit(self, X):
+    def fit(self, X, y=None):
         """Perform clustering.
 
         Parameters
 
@@ -405,7 +405,7 @@ def __init__(self, n_clusters=8, eigen_solver=None, random_state=None,
         self.coef0 = coef0
         self.kernel_params = kernel_params
 
-    def fit(self, X):
+    def fit(self, X, y=None):
         """Creates an affinity matrix for X using the selected affinity,
         then applies spectral clustering to this affinity matrix.
 
 
@@ -412,7 +412,6 @@ def dict_learning(X, n_components, alpha, max_iter=100, tol=1e-8,
     SparsePCA
     MiniBatchSparsePCA
     """
-
     if method not in ('lars', 'cd'):
         raise ValueError('Coding method %r not supported as a fit algorithm.'
                          % method)
@@ -604,6 +603,8 @@ def dict_learning_online(X, n_components=2, alpha=1, n_iter=100,
     MiniBatchSparsePCA
 
     """
+    if n_components is None:
+        n_components = X.shape[1]
 
     if method not in ('lars', 'cd'):
         raise ValueError('Coding method not supported as a fit algorithm.')
@@ -750,7 +751,7 @@ def transform(self, X, y=None):
             Transformed data
 
         """
-        check_is_fitted(self, 'components_') 
+        check_is_fitted(self, 'components_')
 
         # XXX : kwargs is not documented
         X = check_array(X)
@@ -1159,13 +1160,9 @@ def fit(self, X, y=None):
         """
         random_state = check_random_state(self.random_state)
         X = check_array(X)
-        if self.n_components is None:
-            n_components = X.shape[1]
-        else:
-            n_components = self.n_components
 
         U, (A, B), self.n_iter_ = dict_learning_online(
-            X, n_components, self.alpha,
+            X, self.n_components, self.alpha,
             n_iter=self.n_iter, return_code=False,
             method=self.fit_algorithm,
             n_jobs=self.n_jobs, dict_init=self.dict_init,
 
@@ -174,7 +174,7 @@ def fit(self, X, y=None):
             self.partial_fit(X[batch])
         return self
 
-    def partial_fit(self, X):
+    def partial_fit(self, X, y=None):
         """Incremental fit with X. All of X is processed as a single batch.
 
         Parameters