FIX Arbitrary SVC kernels (#11296) · scikit-learn/scikit-learn@84bc8d3 · GitHub

Commit 84bc8d3

FIX Arbitrary SVC kernels (#11296)
1 parent 406184e · commit 84bc8d3

3 files changed (+90, -33 lines)

doc/whats_new/v0.23.rst

Lines changed: 7 additions & 1 deletion

@@ -23,7 +23,7 @@ parameters, may produce different models from the previous version. This often
 occurs due to changes in the modelling logic (bug fixes or enhancements), or in
 random sampling procedures.
 
-- models come here
+- list models here
 
 Details are listed in the changelog below.
 
@@ -210,6 +210,12 @@ Changelog
   `probB_`, are now deprecated as they were not useful. :pr:`15558` by
   `Thomas Fan`_.
 
+- |Fix| Fix use of custom kernels that do not take float entries, such as
+  string kernels, in :class:`svm.SVC` and :class:`svm.SVR`. Note that custom
+  kernels are now expected to validate their input, where they previously
+  received valid numeric arrays.
+  :pr:`11296` by `Alexandre Gramfort`_ and :user:`Georgi Peev <georgipeev>`.
+
 :mod:`sklearn.tree`
 ...................
 

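For context, a minimal sketch (not part of this commit) of what the changelog entry above enables: fitting an SVC directly on a list of strings through a callable kernel. The `string_kernel` below is a condensed, illustrative version of the kernel in the test added by this commit.

    import numpy as np
    from sklearn import svm

    # Samples are raw strings rather than numeric feature vectors.
    data = ["A A", "A", "B", "B B", "A B"]
    y = np.array([1, 1, 2, 2, 1])

    def string_kernel(X1, X2):
        # Gram matrix over (count of 'A', count of 'B'): equivalent to a
        # linear kernel on the implicit count encoding of each string.
        K = np.zeros((len(X1), len(X2)))
        for i, s1 in enumerate(X1):
            for j, s2 in enumerate(X2):
                K[i, j] = (s1.count('A') * s2.count('A')
                           + s1.count('B') * s2.count('B'))
        return K

    # Before this fix, fit() coerced X to a float array and raised on
    # strings; callable kernels now receive X unchanged.
    clf = svm.SVC(kernel=string_kernel).fit(data, y)
    print(clf.predict(data))  # labels predicted for the training strings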
sklearn/svm/_base.py

Lines changed: 30 additions & 21 deletions

@@ -14,7 +14,8 @@
 from ..utils import compute_class_weight
 from ..utils.extmath import safe_sparse_dot
 from ..utils.validation import check_is_fitted, _check_large_sparse
-from ..utils.validation import _check_sample_weight
+from ..utils.validation import _num_samples
+from ..utils.validation import _check_sample_weight, check_consistent_length
 from ..utils.multiclass import check_classification_targets
 from ..exceptions import ConvergenceWarning
 from ..exceptions import NotFittedError
@@ -143,9 +144,13 @@ def fit(self, X, y, sample_weight=None):
             raise TypeError("Sparse precomputed kernels are not supported.")
         self._sparse = sparse and not callable(self.kernel)
 
-        X, y = check_X_y(X, y, dtype=np.float64,
-                         order='C', accept_sparse='csr',
-                         accept_large_sparse=False)
+        if callable(self.kernel):
+            check_consistent_length(X, y)
+        else:
+            X, y = check_X_y(X, y, dtype=np.float64,
+                             order='C', accept_sparse='csr',
+                             accept_large_sparse=False)
+
         y = self._validate_targets(y)
 
         sample_weight = np.asarray([]
@@ -154,24 +159,31 @@ def fit(self, X, y, sample_weight=None):
         solver_type = LIBSVM_IMPL.index(self._impl)
 
         # input validation
-        if solver_type != 2 and X.shape[0] != y.shape[0]:
+        n_samples = _num_samples(X)
+        if solver_type != 2 and n_samples != y.shape[0]:
             raise ValueError("X and y have incompatible shapes.\n" +
                              "X has %s samples, but y has %s." %
-                             (X.shape[0], y.shape[0]))
+                             (n_samples, y.shape[0]))
 
-        if self.kernel == "precomputed" and X.shape[0] != X.shape[1]:
+        if self.kernel == "precomputed" and n_samples != X.shape[1]:
             raise ValueError("Precomputed matrix must be a square matrix."
                              " Input is a {}x{} matrix."
                              .format(X.shape[0], X.shape[1]))
 
-        if sample_weight.shape[0] > 0 and sample_weight.shape[0] != X.shape[0]:
+        if sample_weight.shape[0] > 0 and sample_weight.shape[0] != n_samples:
             raise ValueError("sample_weight and X have incompatible shapes: "
                              "%r vs %r\n"
                              "Note: Sparse matrices cannot be indexed w/"
                              "boolean masks (use `indices=True` in CV)."
                              % (sample_weight.shape, X.shape))
 
-        if isinstance(self.gamma, str):
+        kernel = 'precomputed' if callable(self.kernel) else self.kernel
+
+        if kernel == 'precomputed':
+            # unused but needs to be a float for cython code that ignores
+            # it anyway
+            self._gamma = 0.
+        elif isinstance(self.gamma, str):
             if self.gamma == 'scale':
                 # var = E[X^2] - E[X]^2 if sparse
                 X_var = ((X.multiply(X)).mean() - (X.mean()) ** 2
@@ -187,10 +199,6 @@ def fit(self, X, y, sample_weight=None):
         else:
             self._gamma = self.gamma
 
-        kernel = self.kernel
-        if callable(kernel):
-            kernel = 'precomputed'
-
         fit = self._sparse_fit if self._sparse else self._dense_fit
         if self.verbose:  # pragma: no cover
             print('[LibSVM]', end='')
@@ -199,7 +207,7 @@ def fit(self, X, y, sample_weight=None):
         fit(X, y, sample_weight, solver_type, kernel, random_seed=seed)
         # see comment on the other call to np.iinfo in this file
 
-        self.shape_fit_ = X.shape
+        self.shape_fit_ = X.shape if hasattr(X, "shape") else (n_samples, )
 
         # In binary case, we need to flip the sign of coef, intercept and
         # decision function. Use self._intercept_ and self._dual_coef_
@@ -443,8 +451,10 @@ def _sparse_decision_function(self, X):
     def _validate_for_predict(self, X):
         check_is_fitted(self)
 
-        X = check_array(X, accept_sparse='csr', dtype=np.float64, order="C",
-                        accept_large_sparse=False)
+        if not callable(self.kernel):
+            X = check_array(X, accept_sparse='csr', dtype=np.float64,
+                            order="C", accept_large_sparse=False)
+
         if self._sparse and not sp.isspmatrix(X):
             X = sp.csr_matrix(X)
         if self._sparse:
@@ -454,17 +464,16 @@ def _validate_for_predict(self, X):
             raise ValueError(
                 "cannot use sparse input in %r trained on dense data"
                 % type(self).__name__)
-        n_samples, n_features = X.shape
 
         if self.kernel == "precomputed":
            if X.shape[1] != self.shape_fit_[0]:
                 raise ValueError("X.shape[1] = %d should be equal to %d, "
                                  "the number of samples at training time" %
                                  (X.shape[1], self.shape_fit_[0]))
-        elif n_features != self.shape_fit_[1]:
+        elif not callable(self.kernel) and X.shape[1] != self.shape_fit_[1]:
             raise ValueError("X.shape[1] = %d should be equal to %d, "
                              "the number of features at training time" %
-                             (n_features, self.shape_fit_[1]))
+                             (X.shape[1], self.shape_fit_[1]))
         return X
 
     @property
@@ -920,8 +929,8 @@ def _fit_liblinear(X, y, C, fit_intercept, intercept_scaling, class_weight,
     bias = -1.0
     if fit_intercept:
         if intercept_scaling <= 0:
-            raise ValueError("Intercept scaling is %r but needs to be greater than 0."
-                             " To disable fitting an intercept,"
+            raise ValueError("Intercept scaling is %r but needs to be greater "
+                             "than 0. To disable fitting an intercept,"
                              " set fit_intercept=False." % intercept_scaling)
     else:
         bias = intercept_scaling

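The switch from X.shape[0] to _num_samples in the fit() validation above is what lets the estimator accept inputs without a .shape attribute. A small illustration, assuming only that the private helper _num_samples behaves as it does where this patch imports it:

    import numpy as np
    from sklearn.utils.validation import _num_samples

    # For plain Python sequences, _num_samples falls back to len(); with a
    # callable kernel, X may be such a sequence (e.g. a list of strings).
    print(_num_samples(["A A", "B", "A B"]))  # 3
    # For arrays it uses the first dimension of .shape, as X.shape[0] did.
    print(_num_samples(np.zeros((5, 2))))     # 5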
sklearn/svm/tests/test_svm.py

Lines changed: 53 additions & 11 deletions

@@ -20,9 +20,10 @@
 from sklearn.metrics.pairwise import rbf_kernel
 from sklearn.utils import check_random_state
 from sklearn.utils._testing import assert_warns
-from sklearn.utils._testing import assert_warns_message, assert_raise_message
+from sklearn.utils._testing import assert_raise_message
 from sklearn.utils._testing import ignore_warnings
 from sklearn.utils._testing import assert_no_warnings
+from sklearn.utils.validation import _num_samples
 from sklearn.utils import shuffle
 from sklearn.exceptions import ConvergenceWarning
 from sklearn.exceptions import NotFittedError, UndefinedMetricWarning
@@ -125,7 +126,7 @@ def test_precomputed():
 
     kfunc = lambda x, y: np.dot(x, y.T)
     clf = svm.SVC(kernel=kfunc)
-    clf.fit(X, Y)
+    clf.fit(np.array(X), Y)
     pred = clf.predict(T)
 
     assert_array_equal(clf.dual_coef_, [[-0.25, .25]])
@@ -542,8 +543,8 @@ def test_negative_weights_svc_leave_just_one_label(Classifier,
 
 @pytest.mark.parametrize(
     "Classifier, model",
-    [(svm.SVC, {'when-left': [0.3998, 0.4], 'when-right': [0.4, 0.3999]}),
-    (svm.NuSVC, {'when-left': [0.3333, 0.3333],
+    [(svm.SVC, {'when-left': [0.3998, 0.4], 'when-right': [0.4, 0.3999]}),
+     (svm.NuSVC, {'when-left': [0.3333, 0.3333],
                  'when-right': [0.3333, 0.3333]})],
     ids=['SVC', 'NuSVC']
 )
@@ -681,9 +682,9 @@ def test_unicode_kernel():
     clf.fit(X, Y)
     clf.predict_proba(T)
     _libsvm.cross_validation(iris.data,
-                            iris.target.astype(np.float64), 5,
-                            kernel='linear',
-                            random_seed=0)
+                             iris.target.astype(np.float64), 5,
+                             kernel='linear',
+                             random_seed=0)
 
 
 def test_sparse_precomputed():
@@ -980,7 +981,7 @@ def test_svc_bad_kernel():
 def test_timeout():
     a = svm.SVC(kernel=lambda x, y: np.dot(x, y.T), probability=True,
                 random_state=0, max_iter=1)
-    assert_warns(ConvergenceWarning, a.fit, X, Y)
+    assert_warns(ConvergenceWarning, a.fit, np.array(X), Y)
 
 
 def test_unfitted():
@@ -1026,8 +1027,9 @@ def test_svr_coef_sign():
     for svr in [svm.SVR(kernel='linear'), svm.NuSVR(kernel='linear'),
                 svm.LinearSVR()]:
         svr.fit(X, y)
-        assert_array_almost_equal(svr.predict(X),
-                                  np.dot(X, svr.coef_.ravel()) + svr.intercept_)
+        assert_array_almost_equal(
+            svr.predict(X), np.dot(X, svr.coef_.ravel()) + svr.intercept_
+        )
 
 
 def test_linear_svc_intercept_scaling():
@@ -1094,7 +1096,7 @@ def test_ovr_decision_function():
         base_points * [-1, 1],  # Q2
         base_points * [-1, -1],  # Q3
         base_points * [1, -1]  # Q4
-        ))
+    ))
 
     y_test = [0] * 2 + [1] * 2 + [2] * 2 + [3] * 2
 
@@ -1248,3 +1250,43 @@ def test_svm_probA_proB_deprecated(SVMClass, data, deprecated_prob):
                     "removed in version 0.25.").format(deprecated_prob)
     with pytest.warns(FutureWarning, match=msg):
         getattr(clf, deprecated_prob)
+
+
+@pytest.mark.parametrize("Estimator", [svm.SVC, svm.SVR])
+def test_custom_kernel_not_array_input(Estimator):
+    """Test using a custom kernel that is not fed with array-like for floats"""
+    data = ["A A", "A", "B", "B B", "A B"]
+    X = np.array([[2, 0], [1, 0], [0, 1], [0, 2], [1, 1]])  # count encoding
+    y = np.array([1, 1, 2, 2, 1])
+
+    def string_kernel(X1, X2):
+        assert isinstance(X1[0], str)
+        n_samples1 = _num_samples(X1)
+        n_samples2 = _num_samples(X2)
+        K = np.zeros((n_samples1, n_samples2))
+        for ii in range(n_samples1):
+            for jj in range(ii, n_samples2):
+                K[ii, jj] = X1[ii].count('A') * X2[jj].count('A')
+                K[ii, jj] += X1[ii].count('B') * X2[jj].count('B')
+                K[jj, ii] = K[ii, jj]
+        return K
+
+    K = string_kernel(data, data)
+    assert_array_equal(np.dot(X, X.T), K)
+
+    svc1 = Estimator(kernel=string_kernel).fit(data, y)
+    svc2 = Estimator(kernel='linear').fit(X, y)
+    svc3 = Estimator(kernel='precomputed').fit(K, y)
+
+    assert svc1.score(data, y) == svc3.score(K, y)
+    assert svc1.score(data, y) == svc2.score(X, y)
+    if hasattr(svc1, 'decision_function'):  # classifier
+        assert_allclose(svc1.decision_function(data),
+                        svc2.decision_function(X))
+        assert_allclose(svc1.decision_function(data),
+                        svc3.decision_function(K))
+        assert_array_equal(svc1.predict(data), svc2.predict(X))
+        assert_array_equal(svc1.predict(data), svc3.predict(K))
+    else:  # regressor
+        assert_allclose(svc1.predict(data), svc2.predict(X))
+        assert_allclose(svc1.predict(data), svc3.predict(K))

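One practical consequence of this commit, as the changelog entry notes: the estimator no longer coerces or validates X on behalf of a callable kernel. A minimal sketch (not part of the commit; the name validated_rbf is illustrative) of how a custom kernel that still wants the old numeric validation can opt in explicitly:

    import numpy as np
    from sklearn.utils import check_array
    from sklearn.metrics.pairwise import rbf_kernel

    def validated_rbf(X1, X2):
        # Re-apply the coercion that fit()/predict() performed for callable
        # kernels before this commit.
        X1 = check_array(X1, dtype=np.float64)
        X2 = check_array(X2, dtype=np.float64)
        return rbf_kernel(X1, X2, gamma=0.1)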