scikit-learn
diff --git a/sklearn/tests/test_common.py b/sklearn/tests/test_common.py
Lines changed: 19 additions & 45 deletions
diff --git a/sklearn/utils/estimator_checks.py b/sklearn/utils/estimator_checks.py
Lines changed: 16 additions & 26 deletions
@@ -50,7 +50,6 @@
     check_estimators_overwrite_params,
     check_estimators_partial_fit_n_features,
     check_cluster_overwrite_params,
-    check_sparsify_binary_classifier,
     check_sparsify_multiclass_classifier,
     check_classifier_data_not_an_array,
     check_regressor_data_not_an_array,
@@ -82,6 +81,25 @@ def test_all_estimators():
         yield check_parameters_default_constructible, name, Estimator
 
 
+def test_non_meta_estimators():
+    # Shared input-validation checks for every non-meta estimator.
+    # FIXME these should be done also for non-mixin estimators!
+    skip_nan_inf = CROSS_DECOMPOSITION + ['Imputer']
+    # FIXME! skipped for overwrite_params, in particular GaussianProcess!
+    skip_overwrite = ['CCA', '_CCA', 'PLSCanonical', 'PLSRegression',
+                      'PLSSVD', 'GaussianProcess']
+    kinds = ['classifier', 'regressor', 'transformer', 'cluster']
+    for name, Estimator in all_estimators(type_filter=kinds):
+        if name not in skip_nan_inf:
+            # Test that all estimators check their input for NaNs and infs
+            yield check_estimators_nan_inf, name, Estimator
+        if name not in skip_overwrite:
+            yield check_estimators_overwrite_params, name, Estimator
+        if hasattr(Estimator, 'sparsify'):
+            # Only estimators exposing sparsify get the sparsify check.
+            yield check_sparsify_multiclass_classifier, name, Estimator
+
+
 def test_estimators_sparse_data():
     # All estimators should either deal with sparse data or raise an
     # exception with type TypeError and an intelligible error message
@@ -108,15 +126,6 @@ def test_transformers():
             yield check_transformer, name, Transformer
 
 
-def test_estimators_nan_inf():
-    # Test that all estimators check their input for NaN's and infs
-    estimators = all_estimators(type_filter=['classifier', 'regressor',
-                                             'transformer', 'cluster'])
-    for name, Estimator in estimators:
-        if name not in CROSS_DECOMPOSITION + ['Imputer']:
-            yield check_estimators_nan_inf, name, Estimator
-
-
 def test_clustering():
     # test if clustering algorithms do something sensible
     # also test all shapes / shape errors
@@ -279,18 +288,6 @@ def test_class_weight_auto_linear_classifiers():
         yield check_class_weight_auto_linear_classifier, name, Classifier
 
 
-def test_estimators_overwrite_params():
-    # test whether any classifier overwrites his init parameters during fit
-    for est_type in ["classifier", "regressor", "transformer"]:
-        estimators = all_estimators(type_filter=est_type)
-        for name, Estimator in estimators:
-            if (name not in ['CCA', '_CCA', 'PLSCanonical', 'PLSRegression',
-                             'PLSSVD', 'GaussianProcess']):
-                # FIXME!
-                # in particular GaussianProcess!
-                yield check_estimators_overwrite_params, name, Estimator
-
-
 @ignore_warnings
 def test_import_all_consistency():
     # Smoke test to check that any name in a __all__ list is actually defined
@@ -318,29 +315,6 @@ def test_root_import_all_completeness():
         assert_in(modname, sklearn.__all__)
 
 
-def test_sparsify_estimators():
-    #Test if predict with sparsified estimators works.
-    #Tests regression, binary classification, and multi-class classification.
-    estimators = all_estimators()
-
-    # test regression and binary classification
-    for name, Estimator in estimators:
-        try:
-            Estimator.sparsify
-            yield check_sparsify_binary_classifier, name, Estimator
-        except:
-            pass
-
-    # test multiclass classification
-    classifiers = all_estimators(type_filter='classifier')
-    for name, Classifier in classifiers:
-        try:
-            Classifier.sparsify
-            yield check_sparsify_multiclass_classifier, name, Classifier
-        except:
-            pass
-
-
 def test_non_transformer_estimators_n_iter():
     # Test that all estimators of type which are non-transformer
     # and which have an attribute of max_iter, return the attribute
 
@@ -23,7 +23,8 @@
 from sklearn.utils.testing import SkipTest
 from sklearn.utils.testing import check_skip_travis
 
-from sklearn.base import (clone, ClusterMixin, ClassifierMixin)
+from sklearn.base import (clone, ClusterMixin, ClassifierMixin, RegressorMixin,
+                          TransformerMixin)
 from sklearn.metrics import accuracy_score, adjusted_rand_score, f1_score
 
 from sklearn.lda import LDA
@@ -43,6 +44,13 @@
 CROSS_DECOMPOSITION = ['PLSCanonical', 'PLSRegression', 'CCA', 'PLSSVD']
 
 
+def is_supervised(estimator):
+    # Classifiers and regressors are fit with y; transformers can all
+    # take a y as well, so they are treated as supervised here too.
+    takes_y = (ClassifierMixin, RegressorMixin, TransformerMixin)
+    return isinstance(estimator, takes_y)
+
+
 def _boston_subset(n_samples=200):
     global BOSTON
     if BOSTON is None:
@@ -685,9 +693,9 @@ def check_regressors_train(name, Regressor):
     regressor.fit(X.tolist(), y_.tolist())
     regressor.predict(X)
 
-      # TODO: find out why PLS and CCA fail. RANSAC is random
-      # and furthermore assumes the presence of outliers, hence
-      # skipped
+    # TODO: find out why PLS and CCA fail. RANSAC is random
+    # and furthermore assumes the presence of outliers, hence
+    # skipped
     if name not in ('PLSCanonical', 'CCA', 'RANSACRegressor'):
         assert_greater(regressor.score(X, y_), 0.5)
 
@@ -813,7 +821,10 @@ def check_estimators_overwrite_params(name, Estimator):
     set_random_state(estimator)
 
     params = estimator.get_params()
-    estimator.fit(X, y)
+    if is_supervised(estimator):
+        estimator.fit(X, y)
+    else:
+        estimator.fit(X)
     new_params = estimator.get_params()
     for k, v in params.items():
         assert_false(np.any(new_params[k] != v),
@@ -860,27 +871,6 @@ def check_sparsify_multiclass_classifier(name, Classifier):
     assert_array_equal(pred, pred_orig)
 
 
-def check_sparsify_binary_classifier(name, Estimator):
-    X = np.array([[-2, -1], [-1, -1], [-1, -2], [1, 1], [1, 2], [2, 1]])
-    y = [1, 1, 1, 2, 2, 2]
-    est = Estimator()
-
-    est.fit(X, y)
-    pred_orig = est.predict(X)
-
-    # test sparsify with dense inputs
-    est.sparsify()
-    assert_true(sparse.issparse(est.coef_))
-    pred = est.predict(X)
-    assert_array_equal(pred, pred_orig)
-
-    # pickle and unpickle with sparse coef_
-    est = pickle.loads(pickle.dumps(est))
-    assert_true(sparse.issparse(est.coef_))
-    pred = est.predict(X)
-    assert_array_equal(pred, pred_orig)
-
-
 def check_classifier_data_not_an_array(name, Estimator):
     X = np.array([[3, 0], [0, 1], [0, 2], [1, 1], [1, 2], [2, 1]])
     y = [1, 1, 1, 2, 2, 2]