Merge pull request #10 from glouppe/treeweights · pprett/scikit-learn@3b4bd9f · GitHub

Commit 3b4bd9f

Merge pull request #10 from glouppe/treeweights
Solve conflicts with master
2 parents dd39379 + 719d724 · commit 3b4bd9f

File tree

18 files changed: +257 −110 lines


doc/developers/index.rst

Lines changed: 2 additions & 1 deletion
@@ -145,7 +145,8 @@ rules before submitting a pull request:
 
 You can also check for common programming errors with the following tools:
 
-* Code with a good unittest coverage (at least 80%), check with::
+* Code with a good unittest coverage (at least 90%, better 100%), check
+  with::
 
     $ pip install nose coverage
     $ nosetests --with-coverage path/to/tests_for_package
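
The same check can also be driven from Python; a minimal sketch, assuming nose and coverage are installed as in the snippet above (the test path is the doc's own placeholder):

    import nose

    # Equivalent to: nosetests --with-coverage path/to/tests_for_package
    nose.run(argv=["nosetests", "--with-coverage",
                   "path/to/tests_for_package"])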

doc/modules/multiclass.rst

Lines changed: 7 additions & 6 deletions
@@ -64,7 +64,7 @@ default choice. Below is an example::
   >>> from sklearn.svm import LinearSVC
   >>> iris = datasets.load_iris()
   >>> X, y = iris.data, iris.target
-  >>> OneVsRestClassifier(LinearSVC()).fit(X, y).predict(X)
+  >>> OneVsRestClassifier(LinearSVC(random_state=0)).fit(X, y).predict(X)
   array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
          0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
          0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,

@@ -110,7 +110,7 @@ dataset is used `n_classes` times. Below is an example::
   >>> from sklearn.svm import LinearSVC
   >>> iris = datasets.load_iris()
   >>> X, y = iris.data, iris.target
-  >>> OneVsOneClassifier(LinearSVC()).fit(X, y).predict(X)
+  >>> OneVsOneClassifier(LinearSVC(random_state=0)).fit(X, y).predict(X)
   array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
          0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
          0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,

@@ -139,8 +139,8 @@ At fitting time, one binary classifier per bit in the code book is fitted.
 At prediction time, the classifiers are used to project new points in the
 class space and the class closest to the points is chosen.
 
-In :class:`OutputCodeClassifier`, the `code_size` attribute allows the user to control
-the number of classifiers which will be used. It is a percentage of the
+In :class:`OutputCodeClassifier`, the `code_size` attribute allows the user to
+control the number of classifiers which will be used. It is a percentage of the
 total number of classes.
 
 A number between 0 and 1 will require fewer classifiers than

@@ -162,7 +162,9 @@ Example::
   >>> from sklearn.svm import LinearSVC
   >>> iris = datasets.load_iris()
   >>> X, y = iris.data, iris.target
-  >>> OutputCodeClassifier(LinearSVC(), code_size=2, random_state=0).fit(X, y).predict(X)
+  >>> clf = OutputCodeClassifier(LinearSVC(random_state=0),
+  ...                            code_size=2, random_state=0)
+  >>> clf.fit(X, y).predict(X)
   array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
          0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
          0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1,

@@ -171,7 +173,6 @@ Example::
          2, 2, 2, 2, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1, 2, 2, 2, 1, 1, 2, 2, 2,
          2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2])
 
-
 .. topic:: References:
 
     .. [1] "Solving multiclass learning problems via error-correcting ouput codes",
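
A minimal sketch of why the doctest fixes above seed LinearSVC: liblinear shuffles data internally, so samples near a decision boundary can be predicted differently from run to run, breaking the expected doctest arrays. Only the API shown in the diff is used here:

    from sklearn import datasets
    from sklearn.multiclass import OneVsRestClassifier
    from sklearn.svm import LinearSVC

    iris = datasets.load_iris()
    X, y = iris.data, iris.target
    # Pinning random_state makes the solver deterministic, so the
    # predicted array (and hence the doctest output) is stable.
    clf = OneVsRestClassifier(LinearSVC(random_state=0))
    pred = clf.fit(X, y).predict(X)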

doc/modules/tree.rst

Lines changed: 6 additions & 0 deletions
@@ -123,12 +123,18 @@ Once trained, we can export the tree in `Graphviz
 exporter. Below is an example export of a tree trained on the entire
 iris dataset::
 
+    >>> import StringIO
     >>> with open("iris.dot", 'w') as f:
     ...     f = tree.export_graphviz(clf, out_file=f)
 
 Then we can use Graphviz's ``dot`` tool to create a PDF file (or any other
 supported file type): ``dot -Tpdf iris.dot -o iris.pdf``.
 
+::
+
+    >>> import os
+    >>> os.unlink('iris.dot')
+
 Alternatively, if we have Python module ``pydot`` installed, we can generate
 a PDF file (or any other supported file type) directly in Python::
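
A self-contained sketch of the export-then-clean-up flow this hunk documents; `clf` is assumed to be a fitted DecisionTreeClassifier, as earlier in tree.rst:

    import os
    from sklearn import datasets, tree

    iris = datasets.load_iris()
    clf = tree.DecisionTreeClassifier().fit(iris.data, iris.target)
    with open("iris.dot", "w") as f:
        f = tree.export_graphviz(clf, out_file=f)  # writes dot source
    # Outside Python, render with: dot -Tpdf iris.dot -o iris.pdf
    os.unlink("iris.dot")  # the cleanup step the doctest now performs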

doc/whats_new.rst

Lines changed: 4 additions & 0 deletions
@@ -98,6 +98,10 @@ Changelog
 - Fixed a floating point exception in the :ref:`decision trees <tree>`
   module, by Seberg.
 
+- Fix :func:`metrics.roc_curve` fails when y_true has only one class
+  by Wei Li.
+
+
 API changes summary
 -------------------
 - Renamed all occurences of ``n_atoms`` to ``n_components`` for consistency.
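
A hedged illustration of the new changelog entry: a y_true containing a single class is the degenerate input the roc_curve fix addresses. With only the positive class present, the false-positive rate is 0/0, so expect NaNs rather than an exception; the exact output for this input may vary by version, but the point of the fix is that it no longer fails.

    import numpy as np
    from sklearn.metrics import roc_curve

    y_true = np.ones(4)                       # only one class present
    scores = np.array([0.1, 0.4, 0.35, 0.8])
    fpr, tpr, thresholds = roc_curve(y_true, scores)  # no longer fails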

sklearn/cross_validation.py

Lines changed: 27 additions & 28 deletions
@@ -188,7 +188,7 @@ def __repr__(self):
 
     def __len__(self):
         return int(factorial(self.n) / factorial(self.n - self.p)
-            / factorial(self.p))
+                   / factorial(self.p))
 
 
 def _validate_kfold(k, n_samples):

@@ -257,10 +257,10 @@ class KFold(object):
     """
 
     def __init__(self, n, n_folds=3, indices=True, shuffle=False,
-            random_state=None, k=None):
+                 random_state=None, k=None):
        if k is not None:  # pragma: no cover
            warnings.warn("The parameter k was renamed to n_folds and will be"
-                " removed in 0.15.", DeprecationWarning)
+                          " removed in 0.15.", DeprecationWarning)
            n_folds = k
        _validate_kfold(n_folds, n)
        random_state = check_random_state(random_state)

@@ -353,7 +353,7 @@ class StratifiedKFold(object):
     def __init__(self, y, n_folds=3, indices=True, k=None):
         if k is not None:  # pragma: no cover
             warnings.warn("The parameter k was renamed to n_folds and will be"
-                " removed in 0.15.", DeprecationWarning)
+                          " removed in 0.15.", DeprecationWarning)
             n_folds = k
         y = np.asarray(y)
         n = y.shape[0]

@@ -566,8 +566,8 @@ def __repr__(self):
 
     def __len__(self):
         return int(factorial(self.n_unique_labels) /
-            factorial(self.n_unique_labels - self.p) /
-            factorial(self.p))
+                   factorial(self.n_unique_labels - self.p) /
+                   factorial(self.p))
 
 
 class Bootstrap(object):

@@ -647,8 +647,8 @@ def __init__(self, n, n_iter=3, train_size=.5, test_size=None,
                           "be removed in 0.16.", DeprecationWarning)
             n_iter = n_bootstraps
         self.n_iter = n_iter
-        if (isinstance(train_size, numbers.Real) and train_size >= 0.0
-                and train_size <= 1.0):
+        if (isinstance(train_size, numbers.Real) and train_size >= 0.0 and
+                train_size <= 1.0):
             self.train_size = ceil(train_size * n)
         elif isinstance(train_size, numbers.Integral):
             self.train_size = train_size

@@ -683,10 +683,8 @@ def __iter__(self):
                               + self.test_size]
 
         # bootstrap in each split individually
-        train = rng.randint(0, self.train_size,
-                            size=(self.train_size,))
-        test = rng.randint(0, self.test_size,
-                           size=(self.test_size,))
+        train = rng.randint(0, self.train_size, size=(self.train_size,))
+        test = rng.randint(0, self.test_size, size=(self.test_size,))
         yield ind_train[train], ind_test[test]
 
     def __repr__(self):

@@ -772,12 +770,12 @@ class ShuffleSplit(object):
     """
 
     def __init__(self, n, n_iter=10, test_size=0.1, train_size=None,
-            indices=True, random_state=None, n_iterations=None):
+                 indices=True, random_state=None, n_iterations=None):
         self.n = n
         self.n_iter = n_iter
         if n_iterations is not None:  # pragma: no cover
             warnings.warn("n_iterations was renamed to n_iter for consistency "
-                " and will be removed in 0.16.")
+                          " and will be removed in 0.16.")
             self.n_iter = n_iterations
         self.test_size = test_size
         self.train_size = train_size

@@ -956,14 +954,14 @@ class StratifiedShuffleSplit(object):
     """
 
     def __init__(self, y, n_iter=10, test_size=0.1, train_size=None,
-            indices=True, random_state=None, n_iterations=None):
+                 indices=True, random_state=None, n_iterations=None):
 
         self.y = np.array(y)
         self.n = self.y.size
         self.n_iter = n_iter
         if n_iterations is not None:  # pragma: no cover
             warnings.warn("n_iterations was renamed to n_iter for consistency "
-                " and will be removed in 0.16.")
+                          " and will be removed in 0.16.")
             self.n_iter = n_iterations
         self.test_size = test_size
         self.train_size = train_size

@@ -1025,9 +1023,9 @@ def _cross_val_score(estimator, X, y, score_func, train, test, verbose,
                      fit_params):
     """Inner loop for cross validation"""
     n_samples = X.shape[0] if sp.issparse(X) else len(X)
-    fit_params = dict([(k, np.asarray(v)[train]
-                       if hasattr(v, '__len__') and len(v) == n_samples else v)
-                       for k, v in fit_params.items()])
+    fit_params = dict([(k, np.asarray(v)[train] if hasattr(v, '__len__') and
+                        len(v) == n_samples else v)
+                       for k, v in fit_params.items()])
     if getattr(estimator, "_pairwise", False):
         # X is a precomputed square kernel matrix
         if X.shape[0] != X.shape[1]:

@@ -1105,9 +1103,10 @@ def cross_val_score(estimator, X, y=None, score_func=None, cv=None, n_jobs=1,
     # independent, and that it is pickle-able.
     fit_params = fit_params if fit_params is not None else {}
     scores = Parallel(n_jobs=n_jobs, verbose=verbose)(
-        delayed(_cross_val_score)(clone(estimator), X, y, score_func,
-                                  train, test, verbose, fit_params)
-        for train, test in cv)
+        delayed(_cross_val_score)(
+            clone(estimator), X, y, score_func, train, test, verbose,
+            fit_params)
+        for train, test in cv)
     return np.array(scores)
 
 

@@ -1173,8 +1172,8 @@ def check_cv(cv, X=None, y=None, classifier=False):
 
 
 def permutation_test_score(estimator, X, y, score_func, cv=None,
-        n_permutations=100, n_jobs=1, labels=None,
-        random_state=0, verbose=0):
+                           n_permutations=100, n_jobs=1, labels=None,
+                           random_state=0, verbose=0):
     """Evaluate the significance of a cross-validated score with permutations
 
     Parameters

@@ -1249,10 +1248,10 @@ def permutation_test_score(estimator, X, y, score_func, cv=None,
     # independent, and that it is pickle-able.
     score = _permutation_test_score(clone(estimator), X, y, cv, score_func)
     permutation_scores = Parallel(n_jobs=n_jobs, verbose=verbose)(
-        delayed(_permutation_test_score)(clone(estimator), X,
-                                         _shuffle(y, labels, random_state),
-                                         cv, score_func)
-        for _ in range(n_permutations))
+        delayed(_permutation_test_score)(
+            clone(estimator), X, _shuffle(y, labels, random_state), cv,
+            score_func)
+        for _ in range(n_permutations))
     permutation_scores = np.array(permutation_scores)
     pvalue = (np.sum(permutation_scores >= score) + 1.0) / (n_permutations + 1)
     return score, permutation_scores, pvalue
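
The Parallel/delayed reflows above change indentation only, not dispatch semantics. A standalone sketch of the same call shape, with a hypothetical square function standing in for _cross_val_score:

    from sklearn.externals.joblib import Parallel, delayed

    def square(x):
        return x * x

    # Break after `delayed(func)(`, indent the arguments one level
    # deeper, and keep the generator clause on its own line, as in the
    # reflowed diff above.
    results = Parallel(n_jobs=2)(
        delayed(square)(i)
        for i in range(8))
    assert results == [x * x for x in range(8)]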

sklearn/ensemble/gradient_boosting.py

Lines changed: 4 additions & 1 deletion
@@ -468,7 +468,7 @@ def _fit_stage(self, i, X, X_argsorted, y, y_pred, sample_mask):
             max_depth=self.max_depth,
             min_samples_split=self.min_samples_split,
             min_samples_leaf=self.min_samples_leaf,
-            min_density=0.0,
+            min_density=self.min_density,
             max_features=self.max_features,
             compute_importances=False,
             random_state=self.random_state)

@@ -559,6 +559,9 @@ def fit(self, X, y):
 
         self.random_state = check_random_state(self.random_state)
 
+        # use default min_density (0.1) only for deep trees
+        self.min_density = 0.0 if self.max_depth < 6 else 0.1
+
         # create argsorted X for fast tree induction
         X_argsorted = np.asfortranarray(
             np.argsort(X.T, axis=1).astype(np.int32).T)
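
A sketch of the heuristic added in fit: shallow boosted trees keep min_density at 0.0 (no sample-mask re-packing), while trees of depth 6 or more fall back to the tree module's 0.1 default. The dataset below is only illustrative; the attribute itself comes from the diff:

    from sklearn.datasets import make_hastie_10_2
    from sklearn.ensemble import GradientBoostingClassifier

    X, y = make_hastie_10_2(n_samples=500, random_state=0)
    clf = GradientBoostingClassifier(max_depth=3, n_estimators=10)
    clf.fit(X, y)
    # The derived attribute reflects the heuristic after fitting.
    assert clf.min_density == 0.0  # since max_depth < 6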

sklearn/ensemble/tests/test_gradient_boosting.py

Lines changed: 11 additions & 0 deletions
@@ -475,3 +475,14 @@ def test_mem_layout():
     clf.fit(X, y_)
     assert_array_equal(clf.predict(T), true_result)
     assert_equal(100, len(clf.estimators_))
+
+
+def test_min_density():
+    """Check if min_density is properly set when growing deep trees."""
+    clf = GradientBoostingClassifier(max_depth=6)
+    clf.fit(X, y)
+    assert clf.min_density == 0.1
+
+    clf = GradientBoostingClassifier(max_depth=5)
+    clf.fit(X, y)
+    assert clf.min_density == 0.0

sklearn/feature_extraction/tests/test_image.py

Lines changed: 12 additions & 2 deletions
@@ -246,8 +246,8 @@ def test_extract_patches_strided():
 
     for (image_shape, patch_size, patch_step,
          expected_view, last_patch) in zip(
-            image_shapes, patch_sizes, patch_steps,
-            expected_views, last_patches):
+                image_shapes, patch_sizes, patch_steps, expected_views,
+                last_patches):
         image = np.arange(np.prod(image_shape)).reshape(image_shape)
         patches = extract_patches(image, patch_shape=patch_size,
                                   extraction_step=patch_step)

@@ -261,6 +261,16 @@ def test_extract_patches_strided():
                 image[last_patch_slices].squeeze()).all())
 
 
+def test_extract_patches_square():
+    # test same patch size for all dimensions
+    lena = downsampled_lena
+    i_h, i_w = lena.shape
+    p = 8
+    expected_n_patches = ((i_h - p + 1), (i_w - p + 1))
+    patches = extract_patches(lena, patch_shape=p)
+    assert_true(patches.shape == (expected_n_patches[0], expected_n_patches[1],
+                                  p, p))
+
 if __name__ == '__main__':
     import nose
     nose.runmodule()
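
A sketch of the behavior the new test pins down: passing a single integer as patch_shape applies that size along every dimension. extract_patches is an internal helper in sklearn.feature_extraction.image, so the import path is era-specific:

    import numpy as np
    from sklearn.feature_extraction.image import extract_patches

    image = np.arange(64 * 64).reshape(64, 64)
    patches = extract_patches(image, patch_shape=8)  # same as (8, 8)
    # A strided view: one 8x8 patch per valid top-left corner,
    # (64 - 8 + 1) = 57 positions along each axis.
    assert patches.shape == (57, 57, 8, 8)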

sklearn/grid_search.py

Lines changed: 13 additions & 15 deletions
@@ -77,7 +77,7 @@ def fit_grid_point(X, y, sample_weight, base_clf,
     if verbose > 1:
         start_time = time.time()
         msg = '%s' % (', '.join('%s=%s' % (k, v)
-                      for k, v in clf_params.iteritems()))
+                                for k, v in clf_params.iteritems()))
         print "[GridSearchCV] %s %s" % (msg, (64 - len(msg)) * '.')
 
     X, y = check_arrays(X, y, sparse_format="csr")

@@ -157,7 +157,7 @@ def _check_param_grid(param_grid):
 
         if len(v) == 0:
             raise ValueError("Parameter values should be a non-empty "
-                "list.")
+                             "list.")
 
 
 def _has_one_grid_point(param_grid):

@@ -305,8 +305,7 @@ class GridSearchCV(BaseEstimator, MetaEstimatorMixin):
 
     def __init__(self, estimator, param_grid, loss_func=None, score_func=None,
                  fit_params=None, n_jobs=1, iid=True, refit=True, cv=None,
-                 verbose=0, pre_dispatch='2*n_jobs',
-                 ):
+                 verbose=0, pre_dispatch='2*n_jobs'):
         if not hasattr(estimator, 'fit') or \
            not (hasattr(estimator, 'predict') or hasattr(estimator, 'score')):
             raise TypeError("estimator should a be an estimator implementing"

@@ -396,12 +395,12 @@ def _fit(self, X, y, sample_weight):
 
         pre_dispatch = self.pre_dispatch
         out = Parallel(n_jobs=self.n_jobs, verbose=self.verbose,
-                       pre_dispatch=pre_dispatch)(
-            delayed(fit_grid_point)(
-                X, y, sample_weight, base_clf, clf_params, train, test,
-                self.loss_func, self.score_func, self.verbose,
-                **self.fit_params)
-            for clf_params in grid for train, test in cv)
+                       pre_dispatch=pre_dispatch)(
+                           delayed(fit_grid_point)(
+                               X, y, sample_weight, base_clf, clf_params,
+                               train, test, self.loss_func, self.score_func,
+                               self.verbose, **self.fit_params)
+                           for clf_params in grid for train, test in cv)
 
         # Out is a list of triplet: score, estimator, n_test_samples
         n_grid_points = len(list(grid))

@@ -415,7 +414,7 @@ def _fit(self, X, y, sample_weight):
             score = 0
             these_points = list()
             for this_score, clf_params, this_n_test_samples in \
-                out[grid_start:grid_start + n_folds]:
+                    out[grid_start:grid_start + n_folds]:
                 these_points.append(this_score)
                 if self.iid:
                     this_score *= this_n_test_samples

@@ -461,10 +460,9 @@ def _fit(self, X, y, sample_weight):
         # Store the computed scores
         # XXX: the name is too specific, it shouldn't have
         # 'grid' in it. Also, we should be retrieving/storing variance
-        self.grid_scores_ = [
-            (clf_params, score, all_scores)
-            for clf_params, (score, _), all_scores
-            in zip(grid, scores, cv_scores)]
+        self.grid_scores_ = [(clf_params, score, all_scores)
+                             for clf_params, (score, _), all_scores
+                             in zip(grid, scores, cv_scores)]
         return self
 
     def score(self, X, y=None):
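
The grid_scores_ reflow keeps each entry as a (params, mean_score, fold_scores) triplet. A hedged usage sketch against this era's API (the sklearn.grid_search module path and the grid_scores_ attribute were both replaced in later releases):

    from sklearn import datasets
    from sklearn.grid_search import GridSearchCV
    from sklearn.svm import LinearSVC

    iris = datasets.load_iris()
    search = GridSearchCV(LinearSVC(random_state=0),
                          param_grid={'C': [0.1, 1.0, 10.0]})
    search.fit(iris.data, iris.target)
    # Unpack the triplets the reflowed list comprehension builds.
    means = [score for params, score, fold_scores in search.grid_scores_]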
