[MRG+1] - Voting classifier flatten transform (Continuation) (#9188) · musically-ut/scikit-learn@6f70202

Commit 6f70202

herilalaina authored and amueller committed
[MRG+1] - Voting classifier flatten transform (Continuation) (scikit-learn#9188)
* flatten_transform parameter added to VotingClassifier
* Regression test added
* What's new section added
* flake8 fix
* Improve test and docstring
* Add what's new entry
* default value flatten_transform
* Add test for warning msg
* Fix bug in assert_warns_message
* Move warn msg into transform
* Add deprecation warning
* Merge warning
* Change warn msg
* Move what's new content into Trees and ensembles
* Fixes minor bug
* update what's new
* update test
1 parent d96a462 commit 6f70202

File tree: 3 files changed, +75 additions, -6 deletions

doc/whats_new.rst

Lines changed: 5 additions & 0 deletions

@@ -171,6 +171,11 @@ Trees and ensembles
 
 - :func:`tree.export_graphviz` now shows configurable number of decimal
   places. :issue:`8698` by :user:`Guillaume Lemaitre <glemaitre>`.
+
+- Added ``flatten_transform`` parameter to :class:`ensemble.VotingClassifier`
+  to change the output shape of the ``transform`` method to 2-dimensional.
+  :issue:`7794` by :user:`Ibraim Ganiev <olologin>` and
+  :user:`Herilalaina Rakotoarison <herilalaina>`.
 
 Linear, kernelized and related models
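For orientation, here is a minimal sketch of the behavior the entry above describes, using the same toy data as the new test below. It assumes a scikit-learn build that contains this commit:

    import numpy as np
    from sklearn.ensemble import RandomForestClassifier, VotingClassifier
    from sklearn.linear_model import LogisticRegression
    from sklearn.naive_bayes import GaussianNB

    X = np.array([[-1.1, -1.5], [-1.2, -1.4], [-3.4, -2.2], [1.1, 1.2]])
    y = np.array([1, 1, 2, 2])
    estimators = [('lr', LogisticRegression()),
                  ('rf', RandomForestClassifier()),
                  ('gnb', GaussianNB())]

    # Old behavior: one (n_samples, n_classes) probability block per classifier.
    eclf = VotingClassifier(estimators, voting='soft',
                            flatten_transform=False).fit(X, y)
    print(eclf.transform(X).shape)  # (3, 4, 2)

    # New opt-in behavior: the blocks are stacked side by side into 2-D.
    eclf = VotingClassifier(estimators, voting='soft',
                            flatten_transform=True).fit(X, y)
    print(eclf.transform(X).shape)  # (4, 6)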

sklearn/ensemble/tests/test_voting_classifier.py

Lines changed: 37 additions & 1 deletion

@@ -4,6 +4,7 @@
 from sklearn.utils.testing import assert_almost_equal, assert_array_equal
 from sklearn.utils.testing import assert_equal, assert_true, assert_false
 from sklearn.utils.testing import assert_raise_message
+from sklearn.utils.testing import assert_warns_message
 from sklearn.exceptions import NotFittedError
 from sklearn.linear_model import LogisticRegression
 from sklearn.naive_bayes import GaussianNB

@@ -223,7 +224,7 @@ def test_gridsearch():
     grid.fit(iris.data, iris.target)
 
 
-def test_parallel_predict():
+def test_parallel_fit():
     """Check parallel backend of VotingClassifier on toy dataset."""
     clf1 = LogisticRegression(random_state=123)
     clf2 = RandomForestClassifier(random_state=123)

@@ -364,3 +365,38 @@ def test_estimator_weights_format():
     eclf1.fit(X, y)
     eclf2.fit(X, y)
     assert_array_equal(eclf1.predict_proba(X), eclf2.predict_proba(X))
+
+
+def test_transform():
+    """Check transform method of VotingClassifier on toy dataset."""
+    clf1 = LogisticRegression(random_state=123)
+    clf2 = RandomForestClassifier(random_state=123)
+    clf3 = GaussianNB()
+    X = np.array([[-1.1, -1.5], [-1.2, -1.4], [-3.4, -2.2], [1.1, 1.2]])
+    y = np.array([1, 1, 2, 2])
+
+    eclf1 = VotingClassifier(estimators=[
+        ('lr', clf1), ('rf', clf2), ('gnb', clf3)],
+        voting='soft').fit(X, y)
+    eclf2 = VotingClassifier(estimators=[
+        ('lr', clf1), ('rf', clf2), ('gnb', clf3)],
+        voting='soft',
+        flatten_transform=True).fit(X, y)
+    eclf3 = VotingClassifier(estimators=[
+        ('lr', clf1), ('rf', clf2), ('gnb', clf3)],
+        voting='soft',
+        flatten_transform=False).fit(X, y)
+
+    warn_msg = ("'flatten_transform' default value will be "
+                "changed to True in 0.21. "
+                "To silence this warning you may "
+                "explicitly set flatten_transform=False.")
+    res = assert_warns_message(DeprecationWarning, warn_msg,
+                               eclf1.transform, X)
+    assert_array_equal(res.shape, (3, 4, 2))
+    assert_array_equal(eclf2.transform(X).shape, (4, 6))
+    assert_array_equal(eclf3.transform(X).shape, (3, 4, 2))
+    assert_array_equal(res.swapaxes(0, 1).reshape((4, 6)),
+                       eclf2.transform(X))
+    assert_array_equal(eclf3.transform(X).swapaxes(0, 1).reshape((4, 6)),
+                       eclf2.transform(X))
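The last two assertions in test_transform lean on a pure-NumPy identity: horizontally stacking the per-classifier probability blocks gives the same array as swapping the classifier and sample axes and then reshaping. A standalone sketch of just that identity (the shape (3, 4, 2) mirrors the test's 3 classifiers, 4 samples, and 2 classes):

    import numpy as np

    # Stand-in for _collect_probas output: (n_classifiers, n_samples, n_classes).
    probas = np.arange(3 * 4 * 2, dtype=float).reshape(3, 4, 2)

    # np.hstack concatenates the three (4, 2) blocks along the column axis...
    flat_hstack = np.hstack(probas)                      # shape (4, 6)

    # ...laying out columns classifier-major, exactly like swapaxes + reshape.
    flat_reshape = probas.swapaxes(0, 1).reshape((4, 6))

    assert np.array_equal(flat_hstack, flat_reshape)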

sklearn/ensemble/voting_classifier.py

Lines changed: 33 additions & 5 deletions

@@ -12,6 +12,7 @@
 # License: BSD 3 clause
 
 import numpy as np
+import warnings
 
 from ..base import ClassifierMixin
 from ..base import TransformerMixin

@@ -61,6 +62,13 @@ class VotingClassifier(_BaseComposition, ClassifierMixin, TransformerMixin):
         The number of jobs to run in parallel for ``fit``.
         If -1, then the number of jobs is set to the number of cores.
 
+    flatten_transform : bool, optional (default=None)
+        Affects the shape of the transform output only when voting='soft'.
+        If voting='soft' and flatten_transform=True, the transform method
+        returns a matrix with shape (n_samples, n_classifiers * n_classes).
+        If flatten_transform=False, it returns
+        (n_classifiers, n_samples, n_classes).
+
     Attributes
     ----------
     estimators_ : list of classifiers

@@ -94,18 +102,23 @@ class VotingClassifier(_BaseComposition, ClassifierMixin, TransformerMixin):
     [1 1 1 2 2 2]
     >>> eclf3 = VotingClassifier(estimators=[
     ...    ('lr', clf1), ('rf', clf2), ('gnb', clf3)],
-    ...    voting='soft', weights=[2,1,1])
+    ...    voting='soft', weights=[2,1,1],
+    ...    flatten_transform=True)
     >>> eclf3 = eclf3.fit(X, y)
     >>> print(eclf3.predict(X))
     [1 1 1 2 2 2]
+    >>> print(eclf3.transform(X).shape)
+    (6, 6)
     >>>
     """
 
-    def __init__(self, estimators, voting='hard', weights=None, n_jobs=1):
+    def __init__(self, estimators, voting='hard', weights=None, n_jobs=1,
+                 flatten_transform=None):
         self.estimators = estimators
         self.voting = voting
         self.weights = weights
         self.n_jobs = n_jobs
+        self.flatten_transform = flatten_transform
 
     @property
     def named_estimators(self):

@@ -163,6 +176,7 @@ def fit(self, X, y, sample_weight=None):
         if n_isnone == len(self.estimators):
             raise ValueError('All estimators are None. At least one is '
                              'required to be a classifier!')
+
         self.le_ = LabelEncoder().fit(y)
         self.classes_ = self.le_.classes_
         self.estimators_ = []

@@ -256,16 +270,30 @@ def transform(self, X):
 
         Returns
         -------
-        If `voting='soft'`:
-          array-like = [n_classifiers, n_samples, n_classes]
+        If `voting='soft'` and `flatten_transform=True`:
+          array-like = (n_samples, n_classifiers * n_classes),
+          otherwise array-like = (n_classifiers, n_samples, n_classes).
            Class probabilities calculated by each classifier.
         If `voting='hard'`:
          array-like = [n_samples, n_classifiers]
            Class labels predicted by each classifier.
         """
         check_is_fitted(self, 'estimators_')
 
         if self.voting == 'soft':
-            return self._collect_probas(X)
+            probas = self._collect_probas(X)
+            if self.flatten_transform is None:
+                warnings.warn("'flatten_transform' default value will be "
+                              "changed to True in 0.21. "
+                              "To silence this warning you may "
+                              "explicitly set flatten_transform=False.",
+                              DeprecationWarning)
+                return probas
+            elif not self.flatten_transform:
+                return probas
+            else:
+                return np.hstack(probas)
 
         else:
             return self._predict(X)
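Putting the pieces together, the deprecation path can be exercised end to end. A sketch, again assuming a build that contains this commit (the catch_warnings block is only there to capture the DeprecationWarning for inspection):

    import warnings
    import numpy as np
    from sklearn.ensemble import VotingClassifier
    from sklearn.linear_model import LogisticRegression
    from sklearn.naive_bayes import GaussianNB

    X = np.array([[-1.1, -1.5], [-1.2, -1.4], [-3.4, -2.2], [1.1, 1.2]])
    y = np.array([1, 1, 2, 2])
    eclf = VotingClassifier([('lr', LogisticRegression()),
                             ('gnb', GaussianNB())],
                            voting='soft').fit(X, y)

    # flatten_transform was left at None, so transform() keeps the old 3-D
    # output but warns that the default flips to True in 0.21.
    with warnings.catch_warnings(record=True) as caught:
        warnings.simplefilter("always")
        out = eclf.transform(X)
    print(out.shape)           # (2, 4, 2): (n_classifiers, n_samples, n_classes)
    print(caught[0].category)  # <class 'DeprecationWarning'>

With voting='hard' the parameter is ignored and transform() still returns the (n_samples, n_classifiers) matrix of predicted labels, as before.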
