scikit-learn
diff --git a/asv_benchmarks/asv.conf.json b/asv_benchmarks/asv.conf.json
+2 -2
diff --git a/sklearn/tree/_classes.py b/sklearn/tree/_classes.py
+11 -21
diff --git a/sklearn/tree/_partitioner.pyx b/sklearn/tree/_partitioner.pyx
+2 -2
diff --git a/sklearn/tree/_splitter.pxd b/sklearn/tree/_splitter.pxd
+4
diff --git a/sklearn/tree/_splitter.pyx b/sklearn/tree/_splitter.pyx
+9 -38
@@ -26,7 +26,7 @@
 
     // List of branches to benchmark. If not provided, defaults to "master
     // (for git) or "default" (for mercurial).
-    "branches": ["main"],
+    // "branches": ["main"],
     // "branches": ["default"],    // for mercurial
 
     // The DVCS being used.  If not set, it will be automatically
@@ -40,7 +40,7 @@
     // If missing or the empty string, the tool will be automatically
     // determined by looking for tools on the PATH environment
     // variable.
-    "environment_type": "conda",
+    "environment_type": "mamba",
 
     // timeout in seconds for installing any dependencies in environment
     // defaults to 10 min
 
@@ -520,29 +520,19 @@ def _fit(
         SPLITTERS = SPARSE_SPLITTERS if issparse(X) else DENSE_SPLITTERS
         splitter = self.splitter
         if not isinstance(self.splitter, Splitter):
-            # Random splitter does not need to know about breiman shortcut
-            if self.splitter == "random":
-                splitter = SPLITTERS[self.splitter](
-                    criterion,
-                    self.max_features_,
-                    min_samples_leaf,
-                    min_weight_leaf,
-                    random_state,
-                    monotonic_cst,
-                )
-            else:
-                splitter = SPLITTERS[self.splitter](
-                    criterion,
-                    self.max_features_,
-                    min_samples_leaf,
-                    min_weight_leaf,
-                    random_state,
-                    monotonic_cst,
-                    breiman_shortcut,
-                )
+            # Note: breiman_shortcut is passed to every splitter; random ones ignore it
+            splitter = SPLITTERS[self.splitter](
+                criterion,
+                self.max_features_,
+                min_samples_leaf,
+                min_weight_leaf,
+                random_state,
+                monotonic_cst,
+                breiman_shortcut,
+            )
 
         if (
-            not isinstance(splitter, _splitter.RandomSplitter)
+            not isinstance(splitter, _splitter.RandomDenseSplitter)
             and np.max(n_categories) > 64
         ):
             raise ValueError(
 
@@ -124,7 +124,7 @@ cdef class DensePartitioner(BasePartitioner):
             self.sort_density = np.zeros(1, dtype=np.float32)
 
             # XXX: unsure what this it.
-            self.cat_offs = np.empty(1, dtype=np.int32)
+            self.cat_offset = np.empty(1, dtype=np.int32)
             # A storage of the sorted categories used in Breiman shortcut
             self.sorted_cat = np.empty(1, dtype=np.intp)
 
@@ -642,7 +642,7 @@ cdef class SparsePartitioner(BasePartitioner):
             self.sort_density = np.zeros(1, dtype=np.float32)
 
             # XXX: unsure what this it.
-            self.cat_offs = np.empty(1, dtype=np.int32)
+            self.cat_offset = np.empty(1, dtype=np.int32)
             # A storage of the sorted categories used in Breiman shortcut
             self.sorted_cat = np.empty(1, dtype=np.intp)
 
 
@@ -46,6 +46,10 @@ cdef class Splitter:
     cdef bint with_monotonic_cst
     cdef const float64_t[:] sample_weight
 
+    # Whether or not to sort categories by probabilities to split categorical
+    # features using the Breiman shortcut
+    cdef bint breiman_shortcut
+
     # We know the number of categories within our dataset across each feature.
     # If a feature index has -1, then it is not categorical
     cdef const int32_t[:] n_categories
 
@@ -69,6 +69,7 @@ cdef class Splitter:
         float64_t min_weight_leaf,
         object random_state,
         const int8_t[:] monotonic_cst,
+        bint breiman_shortcut,
         *argv
     ):
         """
@@ -111,6 +112,9 @@ cdef class Splitter:
         self.random_state = random_state
         self.monotonic_cst = monotonic_cst
         self.with_monotonic_cst = monotonic_cst is not None
+
+        # Unused in random splitters
+        self.breiman_shortcut = breiman_shortcut
 
     def __getstate__(self):
         return {}
@@ -126,6 +130,7 @@ cdef class Splitter:
             self.min_weight_leaf,
             self.random_state,
             self.monotonic_cst,
+            self.breiman_shortcut,
         ), self.__getstate__())
 
     cdef int init(
@@ -280,41 +285,7 @@ cdef class Splitter:
         return self.criterion.node_impurity()
 
 
-cdef class BestSplitter(Splitter):
-    """Splitter for finding the best split on dense data.
-
-    breiman_shortcut : bint
-        Whether we use the Breiman shortcut method when splitting
-        a categorical feature.
-    """
-    cdef bint breiman_shortcut
-
-    def __cinit__(
-        self,
-        Criterion criterion,
-        intp_t max_features,
-        intp_t min_samples_leaf,
-        float64_t min_weight_leaf,
-        object random_state,
-        const int8_t[:] monotonic_cst,
-        bint breiman_shortcut,
-        *argv
-    ):
-        self.breiman_shortcut = breiman_shortcut
-
-    def __reduce__(self):
-        return (type(self), (
-            self.criterion,
-            self.max_features,
-            self.min_samples_leaf,
-            self.min_weight_leaf,
-            self.random_state,
-            self.monotonic_cst,
-            self.breiman_shortcut
-        ), self.__getstate__())
-
-
-cdef class BestDenseSplitter(BestSplitter):
+cdef class BestDenseSplitter(Splitter):
     """Splitter for finding the best split on dense data."""
     cdef DensePartitioner partitioner
     cdef int init(
@@ -348,7 +319,7 @@ cdef class BestDenseSplitter(BestSplitter):
             parent_record,
         )
 
-cdef class BestSparseSplitter(BestSplitter):
+cdef class BestSparseSplitter(Splitter):
     """Splitter for finding the best split, using the sparse data."""
     cdef SparsePartitioner partitioner
     cdef int init(
@@ -361,7 +332,7 @@ cdef class BestSparseSplitter(BestSplitter):
     ) except -1:
         Splitter.init(self, X, y, sample_weight, missing_values_in_feature_mask, n_categories)
         self.partitioner = SparsePartitioner(
-            X, self.samples, self.n_samples, self.feature_values, missing_values_in_feature_mask, n_categories
+            X, self.samples, self.n_samples, self.feature_values, missing_values_in_feature_mask, n_categories, self.breiman_shortcut
         )
 
     cdef int node_split(
@@ -438,7 +409,7 @@ cdef class RandomSparseSplitter(Splitter):
 
 
 cdef inline int node_split_best(
-    BestSplitter splitter,
+    Splitter splitter,
     Partitioner partitioner,
     Criterion criterion,
     SplitRecord* split,