[MRG] Prototype 3 for strict check_estimator mode by NicolasHug · Pull Request #17252 · scikit-learn/scikit-learn · GitHub

Closed
25 changes: 24 additions & 1 deletion sklearn/tests/test_common.py
@@ -19,14 +19,15 @@

from sklearn.utils import all_estimators
from sklearn.utils._testing import ignore_warnings
from sklearn.exceptions import ConvergenceWarning
from sklearn.exceptions import ConvergenceWarning, SkipTestWarning
from sklearn.utils.estimator_checks import check_estimator

import sklearn
from sklearn.base import BiclusterMixin

from sklearn.linear_model._base import LinearClassifierMixin
from sklearn.linear_model import LogisticRegression
from sklearn.svm import NuSVC
from sklearn.utils import IS_PYPY
from sklearn.utils._testing import SkipTest
from sklearn.utils.estimator_checks import (
@@ -204,3 +205,25 @@ def test_class_support_removed():

with pytest.raises(TypeError, match=msg):
parametrize_with_checks([LogisticRegression])


def test_strict_mode_check_estimator():
# Make sure the strict checks are properly ignored when strict mode is off
# in check_estimator.
# We can't check the message because check_estimator doesn't give one.

with pytest.warns(SkipTestWarning):
# LogisticRegression has no _xfail_checks, but check_n_features_in is
# still skipped because it's a strict check
check_estimator(LogisticRegression(), strict_mode=False)

with pytest.warns(SkipTestWarning):
# NuSVC has some _xfail_checks. check_n_features_in is skipped along
# with the other checks in the tag.
check_estimator(NuSVC(), strict_mode=False)


@parametrize_with_checks([LogisticRegression(), NuSVC()], strict_mode=False)
def test_strict_mode_parametrize_with_checks(estimator, check):
# Ideally we should assert that the strict checks are Xfailed...
check(estimator)
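
A minimal sketch of what the new test above exercises (assuming this PR's branch, where strict_mode exists and check_n_features_in is the only strict check): with strict_mode=False, the strict check is skipped with a SkipTestWarning even though LogisticRegression has no _xfail_checks tag.

import warnings

from sklearn.exceptions import SkipTestWarning
from sklearn.linear_model import LogisticRegression
from sklearn.utils.estimator_checks import check_estimator

with warnings.catch_warnings(record=True) as caught:
    warnings.simplefilter("always")
    # check_n_features_in is a strict check, so it is skipped rather than run
    check_estimator(LogisticRegression(), strict_mode=False)

assert any(issubclass(w.category, SkipTestWarning) for w in caught)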
71 changes: 56 additions & 15 deletions sklearn/utils/estimator_checks.py
@@ -339,10 +339,12 @@ def _construct_instance(Estimator):
return estimator


def _mark_xfail_checks(estimator, check, pytest):
"""Mark (estimator, check) pairs with xfail according to the
_xfail_checks_ tag"""
xfail_checks = estimator._get_tags()['_xfail_checks'] or {}
def _maybe_mark_xfail(estimator, check, strict_mode, pytest):
# Mark (estimator, check) pairs as XFAIL if the check is in the
# _xfail_checks tag or if it's a strict check and strict_mode=False.
# This is similar to _maybe_skip(), but this one is used by
# @parametrize_with_checks() instead of check_estimator()
xfail_checks = _get_xfail_checks(estimator, strict_mode)
check_name = _set_check_estimator_ids(check)

if check_name not in xfail_checks:
@@ -355,10 +357,13 @@ def _mark_xfail_checks(estimator, check, pytest):
marks=pytest.mark.xfail(reason=reason))


def _skip_if_xfail(estimator, check):
# wrap a check so that it's skipped with a warning if it's part of the
# xfail_checks tag.
xfail_checks = estimator._get_tags()['_xfail_checks'] or {}
def _maybe_skip(estimator, check, strict_mode):
# Wrap a check so that it's skipped with a warning if it's part of the
# xfail_checks tag, or if it's a strict check and strict_mode=False
# This is similar to _maybe_mark_xfail(), but this one is used by
# check_estimator() instead of @parametrize_with_checks which requires
# pytest
xfail_checks = _get_xfail_checks(estimator, strict_mode)
check_name = _set_check_estimator_ids(check)

if check_name not in xfail_checks:
@@ -373,7 +378,23 @@ def wrapped(*args, **kwargs):
return wrapped


def parametrize_with_checks(estimators):
def _get_xfail_checks(estimator, strict_mode):
# Return the checks that are in the estimator's _xfail_checks tag, along
# with the strict checks if strict_mode is False.
xfail_checks = estimator._get_tags()['_xfail_checks'] or {}

if not strict_mode:
strict_checks = {
_set_check_estimator_ids(check):
[Review thread]
Member: This one is a bit unfortunate. I mean, we already have the raw function objects, but I guess not re-using this mechanism means we have to handle partial functions. So it's probably OK for now.

Member (Author): Alternatively we can also directly use _set_check_estimator_ids(check) in the _STRICT_CHECKS dict? That would be a dict of strings instead of a dict of functions.
I'm only using the same logic as for the _xfail_checks tag (which I find... a bit sloppy, I'll give you that ;) )

Member: > Alternatively we can also directly use _set_check_estimator_ids(check) in the _STRICT_CHECKS dict?
No strong feeling about it. It's more of a side comment; I'm OK with the proposed solution as well.
[End thread]
'The check is strict and strict mode is off' # the reason
for check in _STRICT_CHECKS
[Review thread]
Member (@rth, May 20, 2020): I think it might be easier to maintain if it was a decorator on the checks rather than a global list of functions. Didn't we try that in one of the N earlier versions, or were there arguments against it? :)
Edit: although maybe it would make the traceback harder to read?

Member (Author): > Didn't we try that in one of the N earlier versions
One version required a global var, and another one required passing a strict param to every single check, so they're less ideal.
I guess we could have an @is_strict decorator that would set an attribute on the check, but it seems a bit overkill?

Member: OK, let's start with the current approach; we can always add decorators later.
[End thread]
(A hypothetical sketch of that decorator idea follows the _STRICT_CHECKS definition at the end of this diff.)
}
xfail_checks.update(strict_checks)

return xfail_checks
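
For illustration, a small sketch (again assuming this PR's branch) of what _get_xfail_checks returns when strict mode is off: strict checks are keyed by their pprint-style id, exactly like entries of the _xfail_checks tag.

from sklearn.linear_model import LogisticRegression
from sklearn.utils.estimator_checks import _get_xfail_checks

# LogisticRegression has no _xfail_checks tag, so only strict checks appear
print(_get_xfail_checks(LogisticRegression(), strict_mode=False))
# expected: {'check_n_features_in': 'The check is strict and strict mode is off'}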


def parametrize_with_checks(estimators, strict_mode=True):
"""Pytest specific decorator for parametrizing estimator checks.

The `id` of each check is set to be a pprint version of the estimator
@@ -391,6 +412,13 @@ def parametrize_with_checks(estimators):
Passing a class was deprecated in version 0.23, and support for
classes was removed in 0.24. Pass an instance instead.

strict_mode : bool, default=True
If False, the strict checks will be treated as if they were in the
estimators' `_xfail_checks` tag: they will be marked as `xfail` for
pytest. See :ref:`estimator_tags` for more info on the
`_xfail_checks` tag. The set of strict checks is in
`sklearn.utils.estimator_checks._STRICT_CHECKS`.

Returns
-------
decorator : `pytest.mark.parametrize`
@@ -422,14 +450,14 @@ def parametrize_with_checks(estimators):
for check in _yield_all_checks(estimator))

checks_with_marks = (
_mark_xfail_checks(estimator, check, pytest)
_maybe_mark_xfail(estimator, check, strict_mode, pytest)
for estimator, check in checks_generator)

return pytest.mark.parametrize("estimator, check", checks_with_marks,
ids=_set_check_estimator_ids)
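
A usage sketch for the new parameter (MyEstimator is a hypothetical third-party estimator): with strict_mode=False, strict checks show up as xfail in the pytest report instead of failing the session.

from mylib import MyEstimator  # hypothetical third-party estimator
from sklearn.utils.estimator_checks import parametrize_with_checks

@parametrize_with_checks([MyEstimator()], strict_mode=False)
def test_sklearn_compatible_estimator(estimator, check):
    check(estimator)  # strict checks are xfail: a failure won't break the suite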


def check_estimator(Estimator, generate_only=False):
def check_estimator(Estimator, generate_only=False, strict_mode=True):
"""Check if estimator adheres to scikit-learn conventions.

This function will run an extensive test-suite for input validation,
@@ -457,14 +485,21 @@ def check_estimator(Estimator, generate_only=False):
Passing a class was deprecated in version 0.23, and support for
classes was removed in 0.24.

generate_only : bool, optional (default=False)
generate_only : bool, default=False
When `False`, checks are evaluated when `check_estimator` is called.
When `True`, `check_estimator` returns a generator that yields
(estimator, check) tuples. The check is run by calling
`check(estimator)`.

.. versionadded:: 0.22

strict_mode : bool, default=True
If False, the strict checks will be treated as if they were in the
estimator's `_xfail_checks` tag: they will be ignored with a
warning. See :ref:`estimator_tags` for more info on the
`_xfail_checks` tag. The set of strict checks is in
`sklearn.utils.estimator_checks._STRICT_CHECKS`.

Returns
-------
checks_generator : generator
@@ -480,9 +515,10 @@ def check_estimator(Estimator, generate_only=False):
estimator = Estimator
name = type(estimator).__name__

checks_generator = ((estimator,
partial(_skip_if_xfail(estimator, check), name))
for check in _yield_all_checks(estimator))
checks_generator = (
(estimator, partial(_maybe_skip(estimator, check, strict_mode), name))
for check in _yield_all_checks(estimator)
)

if generate_only:
return checks_generator
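
With generate_only=True the skip-wrapping is still visible to the caller. A sketch, assuming (as the collapsed wrapped() body above suggests) that a skipped check raises SkipTest when called:

from sklearn.linear_model import LogisticRegression
from sklearn.utils._testing import SkipTest
from sklearn.utils.estimator_checks import check_estimator

for estimator, check in check_estimator(LogisticRegression(),
                                        generate_only=True,
                                        strict_mode=False):
    try:
        check(estimator)
    except SkipTest as exc:
        print("skipped:", exc)  # strict checks land here when strict_mode=False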
@@ -3026,3 +3062,8 @@ def check_requires_y_none(name, estimator_orig):
except ValueError as ve:
if not any(msg in str(ve) for msg in expected_err_msgs):
warnings.warn(warning_msg, FutureWarning)


_STRICT_CHECKS = set([
check_n_features_in,  # arbitrary, we can decide on the actual list later?
])
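
The @is_strict decorator floated in the second review thread above (set aside for now in favor of this global set) might look like the following. This is a hypothetical sketch only, not part of this PR: the attribute name _is_strict is invented here, and it would still need the partial-function wrinkle from the first thread handled.

def is_strict(check):
    # Hypothetical: tag the check function itself instead of listing it
    # in a global _STRICT_CHECKS set.
    check._is_strict = True
    return check

@is_strict
def check_n_features_in(name, estimator_orig):
    ...  # the existing check body would stay unchanged

# _get_xfail_checks could then discover strict checks by attribute, e.g.:
#   strict = [c for c in checks if getattr(c, '_is_strict', False)]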