scikit-learn
diff --git a/sklearn/multiclass.py b/sklearn/multiclass.py
Lines changed: 54 additions & 24 deletions
diff --git a/sklearn/tests/test_common.py b/sklearn/tests/test_common.py
Lines changed: 0 additions & 1 deletion
diff --git a/sklearn/tests/test_docstring_parameters.py b/sklearn/tests/test_docstring_parameters.py
Lines changed: 1 addition & 3 deletions
diff --git a/sklearn/tests/test_metaestimators.py b/sklearn/tests/test_metaestimators.py
Lines changed: 1 addition & 2 deletions
@@ -50,13 +50,13 @@
 from .utils._tags import _safe_tags
 from .utils.validation import _num_samples
 from .utils.validation import check_is_fitted
-from .utils.validation import check_X_y, check_array
+from .utils.validation import column_or_1d
+from .utils.validation import _assert_all_finite
 from .utils.multiclass import (_check_partial_fit_first_call,
                                check_classification_targets,
                                _ovr_decision_function)
 from .utils.metaestimators import _safe_split, if_delegate_has_method
 from .utils.fixes import delayed
-from .exceptions import NotFittedError
 
 from joblib import Parallel
 
@@ -114,24 +114,28 @@ def _check_estimator(estimator):
 class _ConstantPredictor(BaseEstimator):
 
     def fit(self, X, y):
+        self._check_n_features(X, reset=True)  # fit is the only reset point
         self.y_ = y
         return self
 
     def predict(self, X):
         check_is_fitted(self)
+        self._check_n_features(X, reset=False)  # check, never relearn
 
-        return np.repeat(self.y_, X.shape[0])
+        return np.repeat(self.y_, _num_samples(X))
 
     def decision_function(self, X):
         check_is_fitted(self)
+        self._check_n_features(X, reset=False)  # check, never relearn
 
-        return np.repeat(self.y_, X.shape[0])
+        return np.repeat(self.y_, _num_samples(X))
 
     def predict_proba(self, X):
         check_is_fitted(self)
+        self._check_n_features(X, reset=False)  # check, never relearn
 
         return np.repeat([np.hstack([1 - self.y_, self.y_])],
-                         X.shape[0], axis=0)
+                         _num_samples(X), axis=0)
 
 
 class OneVsRestClassifier(MultiOutputMixin, ClassifierMixin,
@@ -219,6 +223,12 @@ class OneVsRestClassifier(MultiOutputMixin, ClassifierMixin,
     multilabel_ : boolean
         Whether a OneVsRestClassifier is a multilabel classifier.
 
+    n_features_in_ : int
+        Number of features seen during :term:`fit`. Only defined if the
+        underlying estimator exposes such an attribute when fit.
+
+        .. versionadded:: 0.24
+
     Examples
     --------
     >>> import numpy as np
@@ -282,6 +292,9 @@ def fit(self, X, y):
                 self.label_binarizer_.classes_[i]])
             for i, column in enumerate(columns))
 
+        if hasattr(self.estimators_[0], "n_features_in_"):
+            self.n_features_in_ = self.estimators_[0].n_features_in_
+
         return self
 
     @if_delegate_has_method('estimator')
@@ -338,6 +351,9 @@ def partial_fit(self, X, y, classes=None):
             delayed(_partial_fit_binary)(estimator, X, column)
             for estimator, column in zip(self.estimators_, columns))
 
+        if hasattr(self.estimators_[0], "n_features_in_"):
+            self.n_features_in_ = self.estimators_[0].n_features_in_
+
         return self
 
     def predict(self, X):
@@ -504,19 +520,6 @@ def _more_tags(self):
     def _first_estimator(self):
         return self.estimators_[0]
 
-    @property
-    def n_features_in_(self):
-        # For consistency with other estimators we raise a AttributeError so
-        # that hasattr() fails if the OVR estimator isn't fitted.
-        try:
-            check_is_fitted(self)
-        except NotFittedError as nfe:
-            raise AttributeError(
-                "{} object has no n_features_in_ attribute."
-                .format(self.__class__.__name__)
-            ) from nfe
-        return self.estimators_[0].n_features_in_
-
 
 def _fit_ovo_binary(estimator, X, y, i, j):
     """Fit a single binary estimator (one-vs-one)."""
@@ -525,7 +528,7 @@ def _fit_ovo_binary(estimator, X, y, i, j):
     y_binary = np.empty(y.shape, int)
     y_binary[y == i] = 0
     y_binary[y == j] = 1
-    indcond = np.arange(X.shape[0])[cond]
+    indcond = np.arange(_num_samples(X))[cond]
     return _fit_binary(estimator,
                        _safe_split(estimator, X, None, indices=indcond)[0],
                        y_binary, classes=[i, j]), indcond
@@ -593,6 +596,12 @@ class OneVsOneClassifier(MetaEstimatorMixin, ClassifierMixin, BaseEstimator):
             (renaming of 0.25) and onward, `pairwise_indices_` will use the
             pairwise estimator tag instead.
 
+    n_features_in_ : int
+        Number of features seen during :term:`fit`. Only defined if the
+        underlying estimator exposes such an attribute when fit.
+
+        .. versionadded:: 0.24
+
     Examples
     --------
     >>> from sklearn.datasets import load_iris
@@ -626,6 +635,7 @@ def fit(self, X, y):
         -------
         self
         """
+        # We need to validate the data because we do a safe_indexing later.
         X, y = self._validate_data(X, y, accept_sparse=['csr', 'csc'],
                                    force_all_finite=False)
         check_classification_targets(y)
@@ -642,6 +652,9 @@ def fit(self, X, y):
 
         self.estimators_ = estimators_indices[0]
 
+        if hasattr(self.estimators_[0], "n_features_in_"):
+            self.n_features_in_ = self.estimators_[0].n_features_in_
+
         pairwise = _is_pairwise(self)
         self.pairwise_indices_ = (
             estimators_indices[1] if pairwise else None)
@@ -686,8 +699,9 @@ def partial_fit(self, X, y, classes=None):
                              "must be subset of {1}".format(np.unique(y),
                                                             self.classes_))
 
-        X, y = check_X_y(X, y, accept_sparse=['csr', 'csc'],
-                         force_all_finite=False)
+        X, y = self._validate_data(
+            X, y, accept_sparse=['csr', 'csc'], force_all_finite=False,
+            reset=_check_partial_fit_first_call(self, classes))
         check_classification_targets(y)
         combinations = itertools.combinations(range(self.n_classes_), 2)
         self.estimators_ = Parallel(
@@ -699,6 +713,9 @@ def partial_fit(self, X, y, classes=None):
 
         self.pairwise_indices_ = None
 
+        if hasattr(self.estimators_[0], "n_features_in_"):
+            self.n_features_in_ = self.estimators_[0].n_features_in_
+
         return self
 
     def predict(self, X):
@@ -832,6 +849,12 @@ class OutputCodeClassifier(MetaEstimatorMixin, ClassifierMixin, BaseEstimator):
     code_book_ : numpy array of shape [n_classes, code_size]
         Binary array containing the code of each class.
 
+    n_features_in_ : int
+        Number of features seen during :term:`fit`. Only defined if the
+        underlying estimator exposes such an attribute when fit.
+
+        .. versionadded:: 0.24
+
     Examples
     --------
     >>> from sklearn.multiclass import OutputCodeClassifier
@@ -886,7 +909,9 @@ def fit(self, X, y):
         -------
         self
         """
-        X, y = self._validate_data(X, y, accept_sparse=True)
+        y = column_or_1d(y, warn=True)
+        _assert_all_finite(y)
+
         if self.code_size <= 0:
             raise ValueError("code_size should be greater than 0, got {0}"
                              "".format(self.code_size))
@@ -897,6 +922,9 @@ def fit(self, X, y):
 
         self.classes_ = np.unique(y)
         n_classes = self.classes_.shape[0]
+        if n_classes == 0:
+            raise ValueError("OutputCodeClassifier can not be fit when no "
+                             "class is present.")
         code_size_ = int(n_classes * self.code_size)
 
         # FIXME: there are more elaborate methods than generating the codebook
@@ -912,12 +940,15 @@ def fit(self, X, y):
         classes_index = {c: i for i, c in enumerate(self.classes_)}
 
         Y = np.array([self.code_book_[classes_index[y[i]]]
-                      for i in range(X.shape[0])], dtype=int)
+                      for i in range(_num_samples(y))], dtype=int)
 
         self.estimators_ = Parallel(n_jobs=self.n_jobs)(
             delayed(_fit_binary)(self.estimator, X, Y[:, i])
             for i in range(Y.shape[1]))
 
+        if hasattr(self.estimators_[0], "n_features_in_"):
+            self.n_features_in_ = self.estimators_[0].n_features_in_
+
         return self
 
     def predict(self, X):
@@ -934,7 +965,6 @@ def predict(self, X):
             Predicted multi-class targets.
         """
         check_is_fitted(self)
-        X = check_array(X, accept_sparse=True)
         Y = np.array([_predict_binary(e, X) for e in self.estimators_]).T
         pred = euclidean_distances(Y, self.code_book_).argmin(axis=1)
         return self.classes_[pred]
@@ -262,7 +262,6 @@ def test_search_cv(estimator, check, request):
 # check_classifiers_train would need to be updated with the error message
 N_FEATURES_IN_AFTER_FIT_MODULES_TO_IGNORE = {
     'model_selection',
-    'multiclass',
     'multioutput',
     'pipeline',
 }
 
@@ -192,7 +192,6 @@ def _construct_searchcv_instance(SearchCV):
     'linear_model',
     'manifold',
     'model_selection',
-    'multiclass',
     'multioutput',
     'naive_bayes',
     'neighbors',
@@ -219,8 +218,7 @@ def test_fit_docstring_attributes(name, Estimator):
                'CountVectorizer', 'DictVectorizer', 'FeatureUnion',
                'GaussianRandomProjection',
                'MultiOutputClassifier', 'MultiOutputRegressor',
-               'NoSampleWeightWrapper', 'OneVsOneClassifier',
-               'OutputCodeClassifier', 'Pipeline', 'RFE', 'RFECV',
+               'NoSampleWeightWrapper', 'Pipeline', 'RFE', 'RFECV',
                'RegressorChain', 'SelectFromModel',
                'SparseCoder', 'SparseRandomProjection',
                'SpectralBiclustering', 'StackingClassifier',
 
@@ -219,8 +219,7 @@ def _generate_meta_estimator_instances_with_pipeline():
         "IterativeImputer",
         "MultiOutputClassifier",
         "MultiOutputRegressor",
-        "OneVsOneClassifier",
-        "OutputCodeClassifier",
+        "OneVsOneClassifier",  # input validation can't be avoided
         "RANSACRegressor",
         "RFE",
         "RFECV",
Original file line number	Diff line number	Diff line change
`@@ -262,7 +262,6 @@ def test_search_cv(estimator, check, request):`
`262`	`262`	`# check_classifiers_train would need to be updated with the error message`
`263`	`263`	`N_FEATURES_IN_AFTER_FIT_MODULES_TO_IGNORE = {`
`264`	`264`	`'model_selection',`
`265`		`- 'multiclass',`
`266`	`265`	`'multioutput',`
`267`	`266`	`'pipeline',`
`268`	`267`	`}`