raghavrv
diff --git a/‎sklearn/cross_validation.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/cross_validation.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎sklearn/feature_selection/rfe.py
Lines changed: 4 additions & 4 deletions b/‎sklearn/feature_selection/rfe.py
Lines changed: 4 additions & 4 deletions
diff --git a/‎sklearn/grid_search.py
Lines changed: 2 additions & 1 deletion b/‎sklearn/grid_search.py
Lines changed: 2 additions & 1 deletion
diff --git a/‎sklearn/learning_curve.py
Lines changed: 2 additions & 1 deletion b/‎sklearn/learning_curve.py
Lines changed: 2 additions & 1 deletion
diff --git a/‎sklearn/linear_model/coordinate_descent.py
Lines changed: 0 additions & 24 deletions b/‎sklearn/linear_model/coordinate_descent.py
Lines changed: 0 additions & 24 deletions
diff --git a/‎sklearn/linear_model/least_angle.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/linear_model/least_angle.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎sklearn/linear_model/logistic.py
Lines changed: 1 addition & 1 deletion b/‎sklearn/linear_model/logistic.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎sklearn/linear_model/tests/test_logistic.py
Lines changed: 11 additions & 4 deletions b/‎sklearn/linear_model/tests/test_logistic.py
Lines changed: 11 additions & 4 deletions
diff --git a/‎sklearn/metrics/scorer.py
Lines changed: 2 additions & 2 deletions b/‎sklearn/metrics/scorer.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎sklearn/model_selection/__init__.py
Lines changed: 32 additions & 45 deletions b/‎sklearn/model_selection/__init__.py
Lines changed: 32 additions & 45 deletions
diff --git a/‎sklearn/model_selection/search.py renamed to ‎sklearn/model_selection/_search.py
Lines changed: 16 additions & 18 deletions b/‎sklearn/model_selection/search.py renamed to ‎sklearn/model_selection/_search.py
Lines changed: 16 additions & 18 deletions
@@ -37,7 +37,7 @@
               "model_selection module into which all the refactored classes "
               "and functions are moved. Also note that the interface of the "
               "new CV iterators are different from that of this module. "
-              "Refer to model_selection for more info.", DeprecationWarning)
+              "This module will be removed in 0.19.", DeprecationWarning)
 
 
 __all__ = ['KFold',
 
@@ -15,7 +15,7 @@
 from ..base import clone
 from ..base import is_classifier
 from ..model_selection import check_cv
-from ..model_selection.validate import _safe_split, _score
+from ..model_selection._validation import _safe_split, _score
 from ..metrics.scorer import check_scoring
 from .base import SelectorMixin
 
@@ -447,7 +447,7 @@ def fit(self, X, y):
             self.estimator_.set_params(**self.estimator_params)
         self.estimator_.fit(self.transform(X), y)
 
-        # Fixing a normalization error, n is equal to len_cv - 1
-        # here, the scores are normalized by len_cv
-        self.grid_scores_ = scores / cv.n_splits(X, y)
+        # Fixing a normalization error, n is equal to get_n_splits(X, y) - 1
+        # here, the scores are normalized by get_n_splits(X, y)
+        self.grid_scores_ = scores / cv.get_n_splits(X, y)
         return self
@@ -38,7 +38,8 @@
 
 warnings.warn("This module has been deprecated in favor of the "
               "model_selection module into which all the refactored classes "
-              "and functions are moved.", DeprecationWarning)
+              "and functions are moved. This module will be removed in 0.19.",
+              DeprecationWarning)
 
 
 class ParameterGrid(object):
 
@@ -18,7 +18,8 @@
 
 
 warnings.warn("This module has been deprecated in favor of the "
-              "model_selection module into which all the functions are moved.",
+              "model_selection module into which all the functions are moved."
+              " This module will be removed in 0.19",
               DeprecationWarning)
 
 
 
@@ -1370,7 +1370,6 @@ class ElasticNetCV(LinearModelCV, RegressorMixin):
         dual gap for optimality and continues until it is smaller
         than ``tol``.
 
-<<<<<<< HEAD
     cv : int, cross-validation generator or an iterable, optional
         Determines the cross-validation splitting strategy.
         Possible inputs for cv are:
@@ -1383,13 +1382,6 @@ class ElasticNetCV(LinearModelCV, RegressorMixin):
 
         Refer :ref:`User Guide <cross_validation>` for the various
         cross-validation strategies that can be used here.
-=======
-    cv : integer or cross-validation generator, optional
-        If an integer is passed, it is the number of fold (default 3).
-        Specific cross-validation objects can be passed, see the
-        :mod:`sklearn.model_selection.split` module for the list of
-        possible objects.
->>>>>>> ENH introduce the model_selection module
 
     verbose : bool or integer
         Amount of verbosity.
@@ -1860,7 +1852,6 @@ class MultiTaskElasticNetCV(LinearModelCV, RegressorMixin):
         dual gap for optimality and continues until it is smaller
         than ``tol``.
 
-<<<<<<< HEAD
     cv : int, cross-validation generator or an iterable, optional
         Determines the cross-validation splitting strategy.
         Possible inputs for cv are:
@@ -1873,13 +1864,6 @@ class MultiTaskElasticNetCV(LinearModelCV, RegressorMixin):
 
         Refer :ref:`User Guide <cross_validation>` for the various
         cross-validation strategies that can be used here.
-=======
-    cv : integer or cross-validation generator, optional
-        If an integer is passed, it is the number of fold (default 3).
-        Specific cross-validation objects can be passed, see the
-        :mod:`sklearn.model_selection.split` module for the list of
-        possible objects.
->>>>>>> ENH introduce the model_selection module
 
     verbose : bool or integer
         Amount of verbosity.
@@ -2025,7 +2009,6 @@ class MultiTaskLassoCV(LinearModelCV, RegressorMixin):
         dual gap for optimality and continues until it is smaller
         than ``tol``.
 
-<<<<<<< HEAD
     cv : int, cross-validation generator or an iterable, optional
         Determines the cross-validation splitting strategy.
         Possible inputs for cv are:
@@ -2038,13 +2021,6 @@ class MultiTaskLassoCV(LinearModelCV, RegressorMixin):
 
         Refer :ref:`User Guide <cross_validation>` for the various
         cross-validation strategies that can be used here.
-=======
-    cv : integer or cross-validation generator, optional
-        If an integer is passed, it is the number of fold (default 3).
-        Specific cross-validation objects can be passed, see the
-        :mod:`sklearn.model_selection.split` module for the list of
-        possible objects.
->>>>>>> ENH introduce the model_selection module
 
     verbose : bool or integer
         Amount of verbosity.
 
@@ -1086,7 +1086,7 @@ def fit(self, X, y):
                 method=self.method, verbose=max(0, self.verbose - 1),
                 normalize=self.normalize, fit_intercept=self.fit_intercept,
                 max_iter=self.max_iter, eps=self.eps, positive=self.positive)
-            for train, test in cv)
+            for train, test in cv.split(X, y))
         all_alphas = np.concatenate(list(zip(*cv_paths))[0])
         # Unique also sorts
         all_alphas = np.unique(all_alphas)
 
@@ -1308,7 +1308,7 @@ class LogisticRegressionCV(LogisticRegression, BaseEstimator,
     cv : integer or cross-validation generator
         The default cross-validation generator used is Stratified K-Folds.
         If an integer is provided, then it is the number of folds used.
-        See the module :mod:`sklearn.model_selection.split` module for the
+        See the :mod:`sklearn.model_selection` module for the
         list of possible cross-validation objects.
 
     penalty : str, 'l1' or 'l2'
 
@@ -1,4 +1,3 @@
-
 import numpy as np
 import scipy.sparse as sp
 from scipy import linalg, optimize, sparse
@@ -454,16 +453,24 @@ def test_ovr_multinomial_iris():
     train, target = iris.data, iris.target
     n_samples, n_features = train.shape
 
-    # Use pre-defined fold as folds generated for different y
+    # The cv indices from stratified kfold (where stratification is done based
+    # on the fine-grained iris classes, i.e., before the classes 0 and 1 are
+    # conflated) are used for both clf and clf1
     cv = StratifiedKFold(3)
-    clf = LogisticRegressionCV(cv=cv)
+    precomputed_folds = list(cv.split(train, target))
+
+    # Train clf on the original dataset where classes 0 and 1 are separated
+    clf = LogisticRegressionCV(cv=precomputed_folds)
     clf.fit(train, target)
 
-    clf1 = LogisticRegressionCV(cv=cv)
+    # Conflate classes 0 and 1 and train clf1 on this modified dataset
+    clf1 = LogisticRegressionCV(cv=precomputed_folds)
     target_copy = target.copy()
     target_copy[target_copy == 0] = 1
     clf1.fit(train, target_copy)
 
+    # Ensure that what OvR learns for class 2 is the same regardless of whether
+    # classes 0 and 1 are separated or not
     assert_array_almost_equal(clf.scores_[2], clf1.scores_[2])
     assert_array_almost_equal(clf.intercept_[2:], clf1.intercept_)
     assert_array_almost_equal(clf.coef_[2][np.newaxis, :], clf1.coef_)
 
@@ -4,8 +4,8 @@
 arbitrary score functions.
 
 A scorer object is a callable that can be passed to
-:class:`sklearn.model_selection.search.GridSearchCV` or
-:func:`sklearn.model_selection.validation.cross_val_score` as the ``scoring``
+:class:`sklearn.model_selection.GridSearchCV` or
+:func:`sklearn.model_selection.cross_val_score` as the ``scoring``
 parameter, to specify how a model should be evaluated.
 
 The signature of the call is ``(estimator, X, y)`` where ``estimator``
 
@@ -1,48 +1,35 @@
-from .split import KFold
-from .split import StratifiedKFold
-from .split import LeaveOneLabelOut
-from .split import LeaveOneOut
-from .split import LeavePLabelOut
-from .split import LeavePOut
-from .split import ShuffleSplit
-from .split import StratifiedShuffleSplit
-from .split import PredefinedSplit
-from .split import train_test_split
-from .split import check_cv
+from ._split import BaseCrossValidator
+from ._split import KFold
+from ._split import LabelKFold
+from ._split import StratifiedKFold
+from ._split import LeaveOneLabelOut
+from ._split import LeaveOneOut
+from ._split import LeavePLabelOut
+from ._split import LeavePOut
+from ._split import ShuffleSplit
+from ._split import LabelShuffleSplit
+from ._split import StratifiedShuffleSplit
+from ._split import PredefinedSplit
+from ._split import train_test_split
+from ._split import check_cv
 
-from .validate import cross_val_score
-from .validate import cross_val_predict
-from .validate import learning_curve
-from .validate import permutation_test_score
-from .validate import validation_curve
+from ._validation import cross_val_score
+from ._validation import cross_val_predict
+from ._validation import learning_curve
+from ._validation import permutation_test_score
+from ._validation import validation_curve
 
-from .search import GridSearchCV
-from .search import RandomizedSearchCV
-from .search import ParameterGrid
-from .search import ParameterSampler
-from .search import fit_grid_point
+from ._search import GridSearchCV
+from ._search import RandomizedSearchCV
+from ._search import ParameterGrid
+from ._search import ParameterSampler
+from ._search import fit_grid_point
 
-__all__ = ('split',
-           'validate',
-           'search',
-           'KFold',
-           'StratifiedKFold',
-           'LeaveOneLabelOut',
-           'LeaveOneOut',
-           'LeavePLabelOut',
-           'LeavePOut',
-           'ShuffleSplit',
-           'StratifiedShuffleSplit',
-           'PredefinedSplit',
-           'train_test_split',
-           'check_cv',
-           'cross_val_score',
-           'cross_val_predict',
-           'permutation_test_score',
-           'learning_curve',
-           'validation_curve',
-           'GridSearchCV',
-           'ParameterGrid',
-           'fit_grid_point',
-           'ParameterSampler',
-           'RandomizedSearchCV')
+__all__ = ('BaseCrossValidator', 'GridSearchCV', 'KFold', 'LabelKFold',
+           'LeaveOneLabelOut', 'LeaveOneOut', 'LeavePLabelOut', 'LeavePOut',
+           'ParameterGrid', 'ParameterSampler', 'PredefinedSplit',
+           'RandomizedSearchCV', 'ShuffleSplit', 'LabelShuffleSplit',
+           'StratifiedKFold', 'StratifiedShuffleSplit', 'check_cv',
+           'cross_val_predict', 'cross_val_score', 'fit_grid_point',
+           'learning_curve', 'permutation_test_score', 'train_test_split',
+           'validation_curve')
@@ -21,8 +21,8 @@
 
 from ..base import BaseEstimator, is_classifier, clone
 from ..base import MetaEstimatorMixin, ChangedBehaviorWarning
-from .split import check_cv
-from .validate import _fit_and_score
+from ._split import check_cv
+from ._validation import _fit_and_score
 from ..externals.joblib import Parallel, delayed
 from ..externals import six
 from ..utils import check_random_state
@@ -527,7 +527,7 @@ def _fit(self, X, y, labels, parameter_iterable):
                                  'of samples (%i) than data (X: %i samples)'
                                  % (len(y), n_samples))
         cv = check_cv(cv, y, classifier=is_classifier(estimator))
-        len_cv = cv.n_splits(X, y, labels)
+        len_cv = cv.get_n_splits(X, y, labels)
 
         if self.verbose > 0:
             if isinstance(parameter_iterable, Sized):
@@ -552,16 +552,15 @@ def _fit(self, X, y, labels, parameter_iterable):
 
         # Out is a list of triplet: score, estimator, n_test_samples
         n_fits = len(out)
-        n_folds = cv.n_splits(X, y, labels)
 
         scores = list()
         grid_scores = list()
-        for grid_start in range(0, n_fits, n_folds):
+        for grid_start in range(0, n_fits, len_cv):
             n_test_samples = 0
             score = 0
             all_scores = []
             for this_score, this_n_test_samples, _, parameters in \
-                    out[grid_start:grid_start + n_folds]:
+                    out[grid_start:grid_start + len_cv]:
                 all_scores.append(this_score)
                 if self.iid:
                     this_score *= this_n_test_samples
@@ -570,7 +569,7 @@ def _fit(self, X, y, labels, parameter_iterable):
             if self.iid:
                 score /= float(n_test_samples)
             else:
-                score /= float(n_folds)
+                score /= float(len_cv)
             scores.append((score, parameters))
             # TODO: shall we also store the test_fold_sizes?
             grid_scores.append(_CVScoreTuple(
@@ -667,10 +666,10 @@ class GridSearchCV(BaseSearchCV):
         For integer/None inputs, ``StratifiedKFold`` is used for classification
         tasks, when ``y`` is binary or multiclass.
 
-        See the :mod:`sklearn.model_selection.split` module for the list of
-        cross-validation generators that can be used here.
+        See the :mod:`sklearn.model_selection` module for the list of
+        cross-validation strategies that can be used here.
 
-        Also refer :ref:`cross-validation documentation <_cross_validation>`
+        Also refer :ref:`cross-validation documentation <cross_validation>`
 
     refit : boolean, default=True
         Refit the best estimator with the entire dataset.
@@ -680,10 +679,6 @@ class GridSearchCV(BaseSearchCV):
     verbose : integer
         Controls the verbosity: the higher, the more messages.
 
-    random_state : int or RandomState
-        Pseudo random number generator state used for random uniform sampling
-        from lists of possible values instead of scipy.stats distributions.
-
     error_score : 'raise' (default) or numeric
         Value to assign to the score if an error occurs in estimator fitting.
         If set to 'raise', the error is raised. If a numeric value is given,
@@ -877,10 +872,10 @@ class RandomizedSearchCV(BaseSearchCV):
         For integer/None inputs, ``StratifiedKFold`` is used for classification
         tasks, when ``y`` is binary or multiclass.
 
-        See the :mod:`sklearn.model_selection.split` module for the list of
-        cross-validation generators that can be used here.
+        See the :mod:`sklearn.model_selection` module for the list of
+        cross-validation strategies that can be used here.
 
-        Also refer :ref:`cross-validation documentation <_cross_validation>`
+        Also refer :ref:`cross-validation documentation <cross_validation>`
 
     refit : boolean, default=True
         Refit the best estimator with the entire dataset.
@@ -890,13 +885,16 @@ class RandomizedSearchCV(BaseSearchCV):
     verbose : integer
         Controls the verbosity: the higher, the more messages.
 
+    random_state : int or RandomState
+        Pseudo random number generator state used for random uniform sampling
+        from lists of possible values instead of scipy.stats distributions.
+
     error_score : 'raise' (default) or numeric
         Value to assign to the score if an error occurs in estimator fitting.
         If set to 'raise', the error is raised. If a numeric value is given,
         FitFailedWarning is raised. This parameter does not affect the refit
         step, which will always raise the error.
 
-
     Attributes
     ----------
     grid_scores_ : list of named tuples