franslarsson
diff --git a/doc/whats_new/v0.24.rst b/doc/whats_new/v0.24.rst
Lines changed: 5 additions & 0 deletions
diff --git a/sklearn/compose/_column_transformer.py b/sklearn/compose/_column_transformer.py
Lines changed: 8 additions & 64 deletions
diff --git a/sklearn/compose/tests/test_column_transformer.py b/sklearn/compose/tests/test_column_transformer.py
Lines changed: 19 additions & 32 deletions
@@ -111,6 +111,11 @@ Changelog
 - |Fix| :class:`compose.ColumnTransformer` now displays the remainder in the
   diagram display. :pr:`18167` by `Thomas Fan`_.
 
+- |Fix| :class:`compose.ColumnTransformer` now enforces strict count and
+  order of column names between `fit` and `transform` by raising an error
+  instead of a warning, following the deprecation cycle.
+  :pr:`18256` by :user:`Madhura Jayaratne <madhuracj>`.
+
 :mod:`sklearn.covariance`
 .........................
 
 
@@ -6,10 +6,8 @@
 # Author: Andreas Mueller
 #         Joris Van den Bossche
 # License: BSD
-import warnings
 from itertools import chain
 
-import numbers
 import numpy as np
 from scipy import sparse
 from joblib import Parallel
@@ -418,34 +416,6 @@ def _validate_output(self, result):
                     "The output of the '{0}' transformer should be 2D (scipy "
                     "matrix, array, or pandas DataFrame).".format(name))
 
-    def _validate_features(self, n_features, feature_names):
-        """Ensures feature counts and names are the same during fit and
-        transform.
-
-        TODO: It should raise an error from v0.24
-        """
-
-        if ((self._feature_names_in is None or feature_names is None)
-                and self._n_features == n_features):
-            return
-
-        neg_col_present = np.any([_is_negative_indexing(col)
-                                  for col in self._columns])
-        if neg_col_present and self._n_features != n_features:
-            raise RuntimeError("At least one negative column was used to "
-                               "indicate columns, and the new data's number "
-                               "of columns does not match the data given "
-                               "during fit. "
-                               "Please make sure the data during fit and "
-                               "transform have the same number of columns.")
-
-        if (self._n_features != n_features or
-                np.any(self._feature_names_in != np.asarray(feature_names))):
-            warnings.warn("Given feature/column names or counts do not match "
-                          "the ones for the data given during fit. This will "
-                          "fail from v0.24.",
-                          FutureWarning)
-
     def _log_message(self, name, idx, total):
         if not self.verbose:
             return None
@@ -584,30 +554,14 @@ def transform(self, X):
         else:
             X_feature_names = None
 
-        if self._n_features > X.shape[1]:
-            raise ValueError('Number of features of the input must be equal '
-                             'to or greater than that of the fitted '
-                             'transformer. Transformer n_features is {0} '
-                             'and input n_features is {1}.'
-                             .format(self._n_features, X.shape[1]))
-
-        # No column reordering allowed for named cols combined with remainder
-        # TODO: remove this mechanism in 0.24, once we enforce strict column
-        # name order and count. See #14237 for details.
-        if (self._remainder[2] is not None and
-                hasattr(self, '_df_columns') and
-                self._has_str_cols and
-                hasattr(X, 'columns')):
-            n_cols_fit = len(self._df_columns)
-            n_cols_transform = len(X.columns)
-            if (n_cols_transform >= n_cols_fit and
-                    any(X.columns[:n_cols_fit] != self._df_columns)):
-                raise ValueError('Column ordering must be equal for fit '
-                                 'and for transform when using the '
-                                 'remainder keyword')
-
-        # TODO: also call _check_n_features(reset=False) in 0.24
-        self._validate_features(X.shape[1], X_feature_names)
+        self._check_n_features(X, reset=False)
+        if (self._feature_names_in is not None and
+            X_feature_names is not None and
+                np.any(self._feature_names_in != X_feature_names)):
+            raise RuntimeError(
+                "Given feature/column names do not match the ones for the "
+                "data given during fit."
+            )
         Xs = self._fit_transform(X, None, _transform_one, fitted=True)
         self._validate_output(Xs)
 
@@ -801,16 +755,6 @@ def make_column_transformer(*transformers,
                              verbose=verbose)
 
 
-def _is_negative_indexing(key):
-    # TODO: remove in v0.24
-    def is_neg(x): return isinstance(x, numbers.Integral) and x < 0
-    if isinstance(key, slice):
-        return is_neg(key.start) or is_neg(key.stop)
-    elif _determine_key_type(key) == 'int':
-        return np.any(np.asarray(key) < 0)
-    return False
-
-
 class make_column_selector:
     """Create a callable to select columns to be used with
     :class:`ColumnTransformer`.
 
@@ -514,12 +514,13 @@ def test_column_transformer_invalid_columns(remainder):
     ct = ColumnTransformer([('trans', Trans(), col)], remainder=remainder)
     ct.fit(X_array)
     X_array_more = np.array([[0, 1, 2], [2, 4, 6], [3, 6, 9]]).T
-    msg = ("Given feature/column names or counts do not match the ones for "
-           "the data given during fit.")
-    with pytest.warns(FutureWarning, match=msg):
-        ct.transform(X_array_more)  # Should accept added columns, for now
+    msg = ("X has 3 features, but ColumnTransformer is expecting 2 features "
+           "as input.")
+    with pytest.raises(ValueError, match=msg):
+        ct.transform(X_array_more)
     X_array_fewer = np.array([[0, 1, 2], ]).T
-    err_msg = 'Number of features'
+    err_msg = ("X has 1 features, but ColumnTransformer is expecting 2 "
+               "features as input.")
     with pytest.raises(ValueError, match=err_msg):
         ct.transform(X_array_fewer)
 
@@ -1186,17 +1187,18 @@ def test_column_transformer_reordered_column_names_remainder(explicit_colname):
                            remainder=Trans())
 
     tf.fit(X_fit_df)
-    err_msg = 'Column ordering must be equal'
-    warn_msg = ("Given feature/column names or counts do not match the ones "
-                "for the data given during fit.")
-    with pytest.raises(ValueError, match=err_msg):
+    err_msg = ("Given feature/column names do not match the ones for the "
+               "data given during fit.")
+    with pytest.raises(RuntimeError, match=err_msg):
         tf.transform(X_trans_df)
 
-    # No error for added columns if ordering is identical
+    # ValueError for added columns
     X_extended_df = X_fit_df.copy()
     X_extended_df['third'] = [3, 6, 9]
-    with pytest.warns(FutureWarning, match=warn_msg):
-        tf.transform(X_extended_df)  # No error should be raised, for now
+    err_msg = ("X has 3 features, but ColumnTransformer is expecting 2 "
+               "features as input.")
+    with pytest.raises(ValueError, match=err_msg):
+        tf.transform(X_extended_df)
 
     # No 'columns' AttributeError when transform input is a numpy array
     X_array = X_fit_array.copy()
@@ -1218,15 +1220,15 @@ def test_feature_name_validation():
     tf = ColumnTransformer([('bycol', Trans(), ['a', 'b'])])
     tf.fit(df)
 
-    msg = ("Given feature/column names or counts do not match the ones for "
-           "the data given during fit.")
-    with pytest.warns(FutureWarning, match=msg):
+    msg = ("X has 3 features, but ColumnTransformer is expecting 2 features "
+           "as input.")
+    with pytest.raises(ValueError, match=msg):
         tf.transform(df_extra)
 
     tf = ColumnTransformer([('bycol', Trans(), [0])])
     tf.fit(df)
 
-    with pytest.warns(FutureWarning, match=msg):
+    with pytest.raises(ValueError, match=msg):
         tf.transform(X_extra)
 
     with warnings.catch_warnings(record=True) as warns:
@@ -1236,24 +1238,9 @@ def test_feature_name_validation():
     tf = ColumnTransformer([('bycol', Trans(), ['a'])],
                            remainder=Trans())
     tf.fit(df)
-    with pytest.warns(FutureWarning, match=msg):
-        tf.transform(df_extra)
-
-    tf = ColumnTransformer([('bycol', Trans(), [0, -1])])
-    tf.fit(df)
-    msg = "At least one negative column was used to"
-    with pytest.raises(RuntimeError, match=msg):
-        tf.transform(df_extra)
-
-    tf = ColumnTransformer([('bycol', Trans(), slice(-1, -3, -1))])
-    tf.fit(df)
-    with pytest.raises(RuntimeError, match=msg):
+    with pytest.raises(ValueError, match=msg):
         tf.transform(df_extra)
 
-    with warnings.catch_warnings(record=True) as warns:
-        tf.transform(df)
-    assert not warns
-
 
 @pytest.mark.parametrize("array_type", [np.asarray, sparse.csr_matrix])
 def test_column_transformer_mask_indexing(array_type):