scikit-learn · adrinjalali · Oct 16, 2018 · Oct 16, 2018 · Oct 16, 2018 · Oct 16, 2018
diff --git a/doc/modules/compose.rst b/doc/modules/compose.rst
@@ -418,8 +418,8 @@ By default, the remaining rating columns are ignored (``remainder='drop'``)::
   >>> from sklearn.compose import ColumnTransformer
   >>> from sklearn.feature_extraction.text import CountVectorizer
   >>> column_trans = ColumnTransformer(
-  ...     [('city_category', CountVectorizer(analyzer=lambda x: [x]), 'city'),
-  ...      ('title_bow', CountVectorizer(), 'title')],
+  ...     [('city_category', 'city', CountVectorizer(analyzer=lambda x: [x])),
+  ...      ('title_bow', 'title', CountVectorizer())],
   ...     remainder='drop')
 
   >>> column_trans.fit(X) # doctest: +NORMALIZE_WHITESPACE +ELLIPSIS
@@ -458,8 +458,8 @@ We can keep the remaining rating columns by setting
 transformation::
 
   >>> column_trans = ColumnTransformer(
-  ...     [('city_category', CountVectorizer(analyzer=lambda x: [x]), 'city'),
-  ...      ('title_bow', CountVectorizer(), 'title')],
+  ...     [('city_category', 'city', CountVectorizer(analyzer=lambda x: [x])),
+  ...      ('title_bow', 'title', CountVectorizer())],
   ...     remainder='passthrough')
 
   >>> column_trans.fit_transform(X)
@@ -475,8 +475,8 @@ the transformation::
 
   >>> from sklearn.preprocessing import MinMaxScaler
   >>> column_trans = ColumnTransformer(
-  ...     [('city_category', CountVectorizer(analyzer=lambda x: [x]), 'city'),
-  ...      ('title_bow', CountVectorizer(), 'title')],
+  ...     [('city_category', 'city', CountVectorizer(analyzer=lambda x: [x])),
+  ...      ('title_bow', 'title', CountVectorizer())],
   ...     remainder=MinMaxScaler())
 
   >>> column_trans.fit_transform(X)[:, -2:]

diff --git a/doc/whats_new/v0.20.rst b/doc/whats_new/v0.20.rst
@@ -48,6 +48,14 @@ Changelog
   even if all transformation results are sparse. :issue:`12304` by `Andreas
   Müller`_.
 
+- |API| :class:`compose.ColumnTransformer` now expects each entry of
+  ``transformers`` to be a ``(name, columns, transformer)`` tuple instead of
+  ``(name, transformer, columns)``.
+  Support for the ``(name, transformer, columns)`` order will be removed
+  in v0.22; until then, a ``UserWarning`` is issued if the deprecated
+  order is given.
+  :issue:`12339` by :user:`Adrin Jalali <adrinjalali>`.
+
 :mod:`sklearn.datasets`
 ............................
 

diff --git a/examples/compose/plot_column_transformer.py b/examples/compose/plot_column_transformer.py
@@ -93,19 +93,19 @@ def transform(self, posts):
     ('union', ColumnTransformer(
         [
             # Pulling features from the post's subject line (first column)
-            ('subject', TfidfVectorizer(min_df=50), 0),
+            ('subject', 0, TfidfVectorizer(min_df=50)),
 
             # Pipeline for standard bag-of-words model for body (second column)
-            ('body_bow', Pipeline([
+            ('body_bow', 1, Pipeline([
                 ('tfidf', TfidfVectorizer()),
                 ('best', TruncatedSVD(n_components=50)),
-            ]), 1),
+            ])),
 
             # Pipeline for pulling ad hoc features from post's body
-            ('body_stats', Pipeline([
+            ('body_stats', 1, Pipeline([
                 ('stats', TextStats()),  # returns a list of dicts
                 ('vect', DictVectorizer()),  # list of dicts -> feature matrix
-            ]), 1),
+            ])),
         ],
 
         # weight components in ColumnTransformer

diff --git a/examples/compose/plot_column_transformer_mixed_types.py b/examples/compose/plot_column_transformer_mixed_types.py
@@ -65,8 +65,8 @@
 
 preprocessor = ColumnTransformer(
     transformers=[
-        ('num', numeric_transformer, numeric_features),
-        ('cat', categorical_transformer, categorical_features)])
+        ('num', numeric_features, numeric_transformer),
+        ('cat', categorical_features, categorical_transformer)])
 
 # Append classifier to preprocessing pipeline.
 # Now we have a full prediction pipeline.