scikit-learn
diff --git a/doc/whats_new.rst b/doc/whats_new.rst
Lines changed: 5 additions & 0 deletions
diff --git a/sklearn/model_selection/tests/test_search.py b/sklearn/model_selection/tests/test_search.py
Lines changed: 0 additions & 9 deletions
diff --git a/sklearn/model_selection/tests/test_validation.py b/sklearn/model_selection/tests/test_validation.py
Lines changed: 6 additions & 1 deletion
diff --git a/sklearn/svm/base.py b/sklearn/svm/base.py
Lines changed: 1 addition & 2 deletions
diff --git a/sklearn/utils/metaestimators.py b/sklearn/utils/metaestimators.py
Lines changed: 51 additions & 20 deletions
@@ -99,6 +99,11 @@ Enhancements
      A ``TypeError`` will be raised for any other kwargs. :issue:`8028`
      by :user:`Alexander Booth <alexandercbooth>`.
 
+   - :class:`model_selection.GridSearchCV`, :class:`model_selection.RandomizedSearchCV`
+     and :func:`model_selection.cross_val_score` now allow estimators with callable
+     kernels which were previously prohibited. :issue:`8005` by `Andreas Müller`_.
+
+
 Bug fixes
 .........
 
 
@@ -443,15 +443,6 @@ def test_grid_search_precomputed_kernel_error_nonsquare():
     assert_raises(ValueError, cv.fit, K_train, y_train)
 
 
-def test_grid_search_precomputed_kernel_error_kernel_function():
-    # Test that grid search returns an error when using a kernel_function
-    X_, y_ = make_classification(n_samples=200, n_features=100, random_state=0)
-    kernel_function = lambda x1, x2: np.dot(x1, x2.T)
-    clf = SVC(kernel=kernel_function)
-    cv = GridSearchCV(clf, {'C': [0.1, 1.0]})
-    assert_raises(ValueError, cv.fit, X_, y_)
-
-
 class BrokenClassifier(BaseEstimator):
     """Broken classifier that cannot be fit twice"""
 
 
@@ -310,7 +310,12 @@ def test_cross_val_score_precomputed():
     score_precomputed = cross_val_score(svm, linear_kernel, y)
     svm = SVC(kernel="linear")
     score_linear = cross_val_score(svm, X, y)
-    assert_array_equal(score_precomputed, score_linear)
+    assert_array_almost_equal(score_precomputed, score_linear)
+
+    # test with callable
+    svm = SVC(kernel=lambda x, y: np.dot(x, y.T))
+    score_callable = cross_val_score(svm, X, y)
+    assert_array_almost_equal(score_precomputed, score_callable)
 
     # Error raised for non-square X
     svm = SVC(kernel="precomputed")
 
@@ -104,8 +104,7 @@ def __init__(self, impl, kernel, degree, gamma, coef0,
     @property
     def _pairwise(self):
         # Used by cross_val_score.
-        kernel = self.kernel
-        return kernel == "precomputed" or callable(kernel)
+        return self.kernel == "precomputed"
 
     def fit(self, X, y, sample_weight=None):
         """Fit the SVM model according to the given training data.
 
@@ -81,31 +81,62 @@ def if_delegate_has_method(delegate):
 
 
 def _safe_split(estimator, X, y, indices, train_indices=None):
-    """Create subset of dataset and properly handle kernels."""
-    from ..gaussian_process.kernels import Kernel as GPKernel
+    """Create subset of dataset and properly handle kernels.
 
-    if (hasattr(estimator, 'kernel') and callable(estimator.kernel) and
-            not isinstance(estimator.kernel, GPKernel)):
-        # cannot compute the kernel values with custom function
-        raise ValueError("Cannot use a custom kernel function. "
-                         "Precompute the kernel matrix instead.")
+    Slice X, y according to indices for cross-validation, but take care of
+    precomputed kernel-matrices or pairwise affinities / distances.
 
-    if not hasattr(X, "shape"):
-        if getattr(estimator, "_pairwise", False):
+    If ``estimator._pairwise is True``, X needs to be square and
+    we slice rows and columns. If ``train_indices`` is not None,
+    we slice rows using ``indices`` (assumed the test set) and columns
+    using ``train_indices``, indicating the training set.
+
+    Labels y will always be sliced only along the first axis.
+
+    Parameters
+    ----------
+    estimator : object
+        Estimator to determine whether we should slice only rows or rows and
+        columns.
+
+    X : array-like, sparse matrix or iterable
+        Data to be sliced. If ``estimator._pairwise is True``,
+        this needs to be a square array-like or sparse matrix.
+
+    y : array-like, sparse matrix or iterable
+        Targets to be sliced.
+
+    indices : array of int
+        Rows to select from X and y.
+        If ``estimator._pairwise is True`` and ``train_indices is None``
+        then ``indices`` will also be used to slice columns.
+
+    train_indices : array of int or None, default=None
+        If ``estimator._pairwise is True`` and ``train_indices is not None``,
+        then ``train_indices`` will be used to slice the columns of X.
+
+    Returns
+    -------
+    X_sliced : array-like, sparse matrix or list
+        Sliced data.
+
+    y_sliced : array-like, sparse matrix or list
+        Sliced targets.
+
+    """
+    if getattr(estimator, "_pairwise", False):
+        if not hasattr(X, "shape"):
             raise ValueError("Precomputed kernels or affinity matrices have "
                              "to be passed as arrays or sparse matrices.")
-        X_subset = [X[index] for index in indices]
-    else:
-        if getattr(estimator, "_pairwise", False):
-            # X is a precomputed square kernel matrix
-            if X.shape[0] != X.shape[1]:
-                raise ValueError("X should be a square kernel matrix")
-            if train_indices is None:
-                X_subset = X[np.ix_(indices, indices)]
-            else:
-                X_subset = X[np.ix_(indices, train_indices)]
+        # X is a precomputed square kernel matrix
+        if X.shape[0] != X.shape[1]:
+            raise ValueError("X should be a square kernel matrix")
+        if train_indices is None:
+            X_subset = X[np.ix_(indices, indices)]
         else:
-            X_subset = safe_indexing(X, indices)
+            X_subset = X[np.ix_(indices, train_indices)]
+    else:
+        X_subset = safe_indexing(X, indices)
 
     if y is not None:
         y_subset = safe_indexing(y, indices)