Merge remote-tracking branch 'upstream/master' into add_codeblock_copybutton · thoo/scikit-learn@b83f4a5 · GitHub

Commit b83f4a5

Merge remote-tracking branch 'upstream/master' into add_codeblock_copybutton
* upstream/master:
  FIX remove FutureWarning in _object_dtype_isnan and add test (scikit-learn#12567)
  DOC Add 's' to "correspond" in docs for Hamming Loss. (scikit-learn#12565)
  EXA Fix comment in plot-iris-logistic example (scikit-learn#12564)
  FIX stop words validation in text vectorizers with custom preprocessors / tokenizers (scikit-learn#12393)
  DOC Add skorch to related projects (scikit-learn#12561)
  MNT Don't change self.n_values in OneHotEncoder.fit (scikit-learn#12286)
  MNT Remove unused assert_true imports (scikit-learn#12560)
  TST autoreplace assert_true(...==...) with plain assert (scikit-learn#12547)
  DOC: add a testimonial from JP Morgan (scikit-learn#12555)
2 parents 78ba979 + 4e81949 commit b83f4a5

83 files changed, +744 -671 lines changed


doc/related_projects.rst

Lines changed: 3 additions & 0 deletions
@@ -150,6 +150,9 @@ and tasks.
 
 - `lasagne <https://github.com/Lasagne/Lasagne>`_ A lightweight library to
   build and train neural networks in Theano.
+
+- `skorch <https://github.com/dnouri/skorch>`_ A scikit-learn compatible
+  neural network library that wraps PyTorch.
 
 **Broad scope**
 
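The new entry describes skorch in one sentence; as a hedged illustration (not part of this commit), the sketch below shows how a PyTorch module can be wrapped so it behaves like a scikit-learn classifier. The network architecture, synthetic data, and hyperparameters are made up for the example; only the NeuralNetClassifier wrapper and its fit/predict interface come from skorch.

    import numpy as np
    import torch.nn as nn
    from skorch import NeuralNetClassifier

    class MLP(nn.Module):
        """Toy two-layer network; the architecture is illustrative only."""
        def __init__(self, n_features=20, n_classes=2):
            super().__init__()
            self.net = nn.Sequential(
                nn.Linear(n_features, 32),
                nn.ReLU(),
                nn.Linear(32, n_classes),
            )

        def forward(self, X):
            return self.net(X)

    # Synthetic data, with dtypes chosen to match what PyTorch expects.
    X = np.random.rand(100, 20).astype(np.float32)
    y = np.random.randint(0, 2, size=100).astype(np.int64)

    # The wrapped estimator exposes the usual fit/predict API, so it can be
    # dropped into scikit-learn pipelines and grid searches.
    clf = NeuralNetClassifier(MLP, criterion=nn.CrossEntropyLoss,
                              max_epochs=5, lr=0.1, verbose=0)
    clf.fit(X, y)
    print(clf.predict(X[:5]))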

doc/testimonials/images/jpmorgan.png

Binary file added: 8.16 KB

doc/testimonials/testimonials.rst

Lines changed: 33 additions & 0 deletions
@@ -11,6 +11,39 @@ Who is using scikit-learn?
 
 .. to add a testimonials, just XXX
 
+`J.P.Morgan <https://www.jpmorgan.com>`_
+------------------------------------------
+
+.. raw:: html
+
+   <div class="logo">
+
+.. image:: images/jpmorgan.png
+   :width: 120pt
+   :target: https://www.jpmorgan.com
+
+.. raw:: html
+
+   </div>
+
+Scikit-learn is an indispensable part of the Python machine learning
+toolkit at JPMorgan. It is very widely used across all parts of the bank
+for classification, predictive analytics, and very many other machine
+learning tasks. Its straightforward API, its breadth of algorithms, and
+the quality of its documentation combine to make scikit-learn
+simultaneously very approachable and very powerful.
+
+.. raw:: html
+
+   <span class="testimonial-author">
+
+Stephen Simmons, VP, Athena Research, JPMorgan
+
+.. raw:: html
+
+   </span>
+
+
 `Spotify <https://www.spotify.com>`_
 ------------------------------------
 

doc/whats_new/v0.20.rst

Lines changed: 8 additions & 0 deletions
@@ -85,6 +85,14 @@ Changelog
   where ``max_features`` was sometimes rounded down to zero.
   :issue:`12388` by :user:`Connor Tann <Connossor>`.
 
+:mod:`sklearn.feature_extraction`
+...........................
+
+- |Fix| Fixed a regression in v0.20.0 where
+  :func:`feature_extraction.text.CountVectorizer` and other text vectorizers
+  could error during stop words validation with custom preprocessors
+  or tokenizers. :issue:`12393` by `Roman Yurchak`_.
+
 :mod:`sklearn.linear_model`
 ...........................
 
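The regression described in this entry is easiest to see with a small, hedged sketch: a vectorizer whose custom preprocessor only understands structured records, combined with a built-in stop word list. The record format and the custom_preprocessor helper below are invented for illustration; with the fix from scikit-learn#12393 the stop word consistency check no longer aborts the fit when it cannot apply such a preprocessor to the stop words themselves.

    from sklearn.feature_extraction.text import CountVectorizer

    # Hypothetical corpus: each document is a dict, so a custom preprocessor
    # is needed to pull the raw text out before tokenization.
    docs = [{"text": "The quick brown fox"},
            {"text": "jumps over the lazy dog"}]

    def custom_preprocessor(record):
        # Illustrative helper (not from the commit): extract and lowercase
        # the text field of a record.
        return record["text"].lower()

    vectorizer = CountVectorizer(preprocessor=custom_preprocessor,
                                 stop_words="english")

    # In 0.20.0 the stop word consistency check applied the preprocessor to
    # each stop word (a plain string), which raised for a dict-only
    # preprocessor; with this fix the check is skipped gracefully and the
    # fit succeeds.
    X = vectorizer.fit_transform(docs)
    print(X.shape)  # (2, number of non-stop-word terms)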

examples/linear_model/plot_iris_logistic.py

Lines changed: 1 addition & 1 deletion
@@ -30,7 +30,7 @@
 
 logreg = LogisticRegression(C=1e5, solver='lbfgs', multi_class='multinomial')
 
-# we create an instance of Neighbours Classifier and fit the data.
+# Create an instance of Logistic Regression Classifier and fit the data.
 logreg.fit(X, Y)
 
 # Plot the decision boundary. For that, we will assign a color to each

sklearn/cluster/tests/test_affinity_propagation.py

Lines changed: 3 additions & 3 deletions
@@ -7,7 +7,7 @@
 
 from sklearn.exceptions import ConvergenceWarning
 from sklearn.utils.testing import (
-    assert_equal, assert_false, assert_true, assert_array_equal, assert_raises,
+    assert_equal, assert_false, assert_array_equal, assert_raises,
     assert_warns, assert_warns_message, assert_no_warnings)
 
 from sklearn.cluster.affinity_propagation_ import AffinityPropagation
@@ -160,5 +160,5 @@ def test_equal_similarities_and_preferences():
     assert_false(_equal_similarities_and_preferences(S, np.array([0, 1])))
 
     # Same preferences
-    assert_true(_equal_similarities_and_preferences(S, np.array([0, 0])))
-    assert_true(_equal_similarities_and_preferences(S, np.array(0)))
+    assert _equal_similarities_and_preferences(S, np.array([0, 0]))
+    assert _equal_similarities_and_preferences(S, np.array(0))
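This file and the test modules below apply the same mechanical rewrite: assert_true(expr) from sklearn.utils.testing becomes a bare assert expr. A small, hedged sketch of why the plain form is preferred under pytest (the test function and values are illustrative, not taken from this commit):

    import numpy as np

    def test_preferences_are_equal():
        # Illustrative similarity matrix and preferences only.
        S = -np.array([[0., 1.], [1., 0.]])
        preferences = np.array([0, 0])

        # With a bare assert, pytest's assertion rewriting reports the
        # evaluated operands on failure; assert_true only reported that a
        # boolean was not True.
        assert preferences.min() == preferences.max()

        # The optional message form survives unchanged, mirroring the
        # assert_true(cond, msg) -> "assert cond, msg" rewrite used in
        # test_k_means.py further down.
        assert S.shape[0] == S.shape[1], "similarity matrix must be square"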

sklearn/cluster/tests/test_bicluster.py

Lines changed: 1 addition & 2 deletions
@@ -10,7 +10,6 @@
 from sklearn.utils.testing import assert_array_equal
 from sklearn.utils.testing import assert_array_almost_equal
 from sklearn.utils.testing import assert_raises
-from sklearn.utils.testing import assert_true
 from sklearn.utils.testing import SkipTest
 
 from sklearn.base import BaseEstimator, BiclusterMixin
@@ -51,7 +50,7 @@ def test_get_submatrix():
         submatrix[:] = -1
         if issparse(X):
             X = X.toarray()
-        assert_true(np.all(X != -1))
+        assert np.all(X != -1)
 
 
 def _test_shape_indices(model):

sklearn/cluster/tests/test_feature_agglomeration.py

Lines changed: 11 additions & 11 deletions
@@ -4,7 +4,7 @@
 # Authors: Sergul Aydore 2017
 import numpy as np
 from sklearn.cluster import FeatureAgglomeration
-from sklearn.utils.testing import assert_true, assert_no_warnings
+from sklearn.utils.testing import assert_no_warnings
 from sklearn.utils.testing import assert_array_almost_equal
 
 
@@ -18,24 +18,24 @@ def test_feature_agglomeration():
                                         pooling_func=np.median)
     assert_no_warnings(agglo_mean.fit, X)
     assert_no_warnings(agglo_median.fit, X)
-    assert_true(np.size(np.unique(agglo_mean.labels_)) == n_clusters)
-    assert_true(np.size(np.unique(agglo_median.labels_)) == n_clusters)
-    assert_true(np.size(agglo_mean.labels_) == X.shape[1])
-    assert_true(np.size(agglo_median.labels_) == X.shape[1])
+    assert np.size(np.unique(agglo_mean.labels_)) == n_clusters
+    assert np.size(np.unique(agglo_median.labels_)) == n_clusters
+    assert np.size(agglo_mean.labels_) == X.shape[1]
+    assert np.size(agglo_median.labels_) == X.shape[1]
 
     # Test transform
     Xt_mean = agglo_mean.transform(X)
     Xt_median = agglo_median.transform(X)
-    assert_true(Xt_mean.shape[1] == n_clusters)
-    assert_true(Xt_median.shape[1] == n_clusters)
-    assert_true(Xt_mean == np.array([1 / 3.]))
-    assert_true(Xt_median == np.array([0.]))
+    assert Xt_mean.shape[1] == n_clusters
+    assert Xt_median.shape[1] == n_clusters
+    assert Xt_mean == np.array([1 / 3.])
+    assert Xt_median == np.array([0.])
 
     # Test inverse transform
     X_full_mean = agglo_mean.inverse_transform(Xt_mean)
     X_full_median = agglo_median.inverse_transform(Xt_median)
-    assert_true(np.unique(X_full_mean[0]).size == n_clusters)
-    assert_true(np.unique(X_full_median[0]).size == n_clusters)
+    assert np.unique(X_full_mean[0]).size == n_clusters
+    assert np.unique(X_full_median[0]).size == n_clusters
 
     assert_array_almost_equal(agglo_mean.transform(X_full_mean),
                               Xt_mean)

sklearn/cluster/tests/test_hierarchical.py

Lines changed: 8 additions & 9 deletions
@@ -14,7 +14,6 @@
 from scipy import sparse
 from scipy.cluster import hierarchy
 
-from sklearn.utils.testing import assert_true
 from sklearn.utils.testing import assert_raises
 from sklearn.utils.testing import assert_equal
 from sklearn.utils.testing import assert_almost_equal
@@ -72,7 +71,7 @@ def test_structured_linkage_tree():
         children, n_components, n_leaves, parent = \
             tree_builder(X.T, connectivity)
         n_nodes = 2 * X.shape[1] - 1
-        assert_true(len(children) + n_leaves == n_nodes)
+        assert len(children) + n_leaves == n_nodes
     # Check that ward_tree raises a ValueError with a connectivity matrix
     # of the wrong shape
     assert_raises(ValueError,
@@ -114,7 +113,7 @@ def test_height_linkage_tree():
     for linkage_func in _TREE_BUILDERS.values():
         children, n_nodes, n_leaves, parent = linkage_func(X.T, connectivity)
         n_nodes = 2 * X.shape[1] - 1
-        assert_true(len(children) + n_leaves == n_nodes)
+        assert len(children) + n_leaves == n_nodes
 
 
 def test_agglomerative_clustering_wrong_arg_memory():
@@ -152,7 +151,7 @@ def test_agglomerative_clustering():
                                              linkage=linkage)
         clustering.fit(X)
         labels = clustering.labels_
-        assert_true(np.size(np.unique(labels)) == 10)
+        assert np.size(np.unique(labels)) == 10
     finally:
         shutil.rmtree(tempdir)
     # Turn caching off now
@@ -166,7 +165,7 @@ def test_agglomerative_clustering():
                         labels), 1)
     clustering.connectivity = None
     clustering.fit(X)
-    assert_true(np.size(np.unique(clustering.labels_)) == 10)
+    assert np.size(np.unique(clustering.labels_)) == 10
     # Check that we raise a TypeError on dense matrices
     clustering = AgglomerativeClustering(
         n_clusters=10,
@@ -226,12 +225,12 @@ def test_ward_agglomeration():
     connectivity = grid_to_graph(*mask.shape)
     agglo = FeatureAgglomeration(n_clusters=5, connectivity=connectivity)
     agglo.fit(X)
-    assert_true(np.size(np.unique(agglo.labels_)) == 5)
+    assert np.size(np.unique(agglo.labels_)) == 5
 
     X_red = agglo.transform(X)
-    assert_true(X_red.shape[1] == 5)
+    assert X_red.shape[1] == 5
     X_full = agglo.inverse_transform(X_red)
-    assert_true(np.unique(X_full[0]).size == 5)
+    assert np.unique(X_full[0]).size == 5
     assert_array_almost_equal(agglo.transform(X_full), X_red)
 
     # Check that fitting with no samples raises a ValueError
@@ -265,7 +264,7 @@ def assess_same_labelling(cut1, cut2):
         ecut = np.zeros((n, k))
         ecut[np.arange(n), cut] = 1
         co_clust.append(np.dot(ecut, ecut.T))
-    assert_true((co_clust[0] == co_clust[1]).all())
+    assert (co_clust[0] == co_clust[1]).all()
 
 
 def test_scikit_vs_scipy():

sklearn/cluster/tests/test_k_means.py

Lines changed: 6 additions & 7 deletions
@@ -13,7 +13,6 @@
 from sklearn.utils.testing import assert_almost_equal
 from sklearn.utils.testing import assert_raises
 from sklearn.utils.testing import assert_raises_regex
-from sklearn.utils.testing import assert_true
 from sklearn.utils.testing import assert_greater
 from sklearn.utils.testing import assert_less
 from sklearn.utils.testing import assert_warns
@@ -107,8 +106,8 @@ def test_labels_assignment_and_inertia():
         labels_gold[dist < mindist] = center_id
         mindist = np.minimum(dist, mindist)
     inertia_gold = mindist.sum()
-    assert_true((mindist >= 0.0).all())
-    assert_true((labels_gold != -1).all())
+    assert (mindist >= 0.0).all()
+    assert (labels_gold != -1).all()
 
     sample_weight = None
 
@@ -565,9 +564,9 @@ def test_k_means_non_collapsed():
     assert_equal(len(np.unique(km.labels_)), 3)
 
     centers = km.cluster_centers_
-    assert_true(np.linalg.norm(centers[0] - centers[1]) >= 0.1)
-    assert_true(np.linalg.norm(centers[0] - centers[2]) >= 0.1)
-    assert_true(np.linalg.norm(centers[1] - centers[2]) >= 0.1)
+    assert np.linalg.norm(centers[0] - centers[1]) >= 0.1
+    assert np.linalg.norm(centers[0] - centers[2]) >= 0.1
+    assert np.linalg.norm(centers[1] - centers[2]) >= 0.1
 
 
 @pytest.mark.parametrize('algo', ['full', 'elkan'])
@@ -689,7 +688,7 @@ def test_n_init():
     failure_msg = ("Inertia %r should be decreasing"
                    " when n_init is increasing.") % list(inertia)
     for i in range(len(n_init_range) - 1):
-        assert_true(inertia[i] >= inertia[i + 1], failure_msg)
+        assert inertia[i] >= inertia[i + 1], failure_msg
 
 
 def test_k_means_function():

0 commit comments
