P3K use six to have a python 2 & 3 compatible code base · seckcoder/scikit-learn@1967a0b · GitHub
Commit 1967a0b

ogrisel authored and larsmans committed
P3K use six to have a python 2 & 3 compatible code base
1 parent 9f1c346 commit 1967a0b

59 files changed: +401 −361 lines (only the first files of this large diff are shown below).
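Reviewer's note: the commit replaces Python-2-only constructs (dict.iteritems, print statements, xrange, basestring, cPickle) with equivalents from six, vendored as sklearn.externals.six. A minimal sketch of the idioms involved (the six module itself is not shown in this excerpt; in modern scikit-learn releases the vendored copy has been removed, but a plain `import six` from PyPI behaves the same):

from sklearn.externals import six  # the vendored copy; `import six` works too

d = {'a': 1, 'b': 2}
for key, value in six.iteritems(d):       # d.iteritems() on Py2, d.items() on Py3
    print('%s=%r' % (key, value))

assert isinstance('text', six.string_types)   # basestring on Py2, str on Py3
assert list(six.moves.range(3)) == [0, 1, 2]  # xrange on Py2, range on Py3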

setup.py

Lines changed: 1 addition & 16 deletions

@@ -98,28 +98,13 @@ def configuration(parent_package='', top_path=None):
         _old_stdout = sys.stdout
         try:
             sys.stdout = StringIO()  # supress noisy output
-            res = lib2to3.main.main("lib2to3.fixes",
-                                    ['-x', 'import', '-w', local_path])
+            res = lib2to3.main.main("lib2to3.fixes", ['-x', 'import', '-w', local_path])
         finally:
             sys.stdout = _old_stdout
 
         if res != 0:
             raise Exception('2to3 failed, exiting ...')
 
-        # Ugly hack to make pip work with Python 3, see
-        # http://projects.scipy.org/numpy/ticket/1857.
-        # Explanation: pip messes with __file__ which interacts badly with the
-        # change in directory due to the 2to3 conversion. Therefore we restore
-        # __file__ to what it would have been otherwise.
-        global __file__
-        __file__ = os.path.join(os.curdir, os.path.basename(__file__))
-        if '--egg-base' in sys.argv:
-            # Change pip-egg-info entry to absolute path, so pip can find it
-            # after changing directory.
-            idx = sys.argv.index('--egg-base')
-            if sys.argv[idx + 1] == 'pip-egg-info':
-                sys.argv[idx + 1] = os.path.join(old_path, 'pip-egg-info')
-
     os.chdir(local_path)
     sys.path.insert(0, local_path)
 
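Reviewer's note: the call being reflowed drives 2to3 programmatically during a Python 3 build. A hedged sketch of the same pattern on a hypothetical build directory (`lib2to3.main.main(fixer_pkg, args)` returns a shell-style exit status; lib2to3 is deprecated since Python 3.9 and removed in 3.13):

import sys
import lib2to3.main
from io import StringIO

build_dir = 'build/py3'  # hypothetical path, not from the commit

_old_stdout = sys.stdout
try:
    sys.stdout = StringIO()  # silence lib2to3's per-file diff output
    # '-x import' excludes the import fixer; '-w' writes fixes back to disk
    res = lib2to3.main.main("lib2to3.fixes", ['-x', 'import', '-w', build_dir])
finally:
    sys.stdout = _old_stdout

if res != 0:
    raise Exception('2to3 failed, exiting ...')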

sklearn/base.py

Lines changed: 4 additions & 3 deletions

@@ -8,6 +8,7 @@
 
 import numpy as np
 from scipy import sparse
+from .externals import six
 
 
 ###############################################################################
@@ -42,7 +43,7 @@ def clone(estimator, safe=True):
                             % (repr(estimator), type(estimator)))
     klass = estimator.__class__
     new_object_params = estimator.get_params(deep=False)
-    for name, param in new_object_params.iteritems():
+    for name, param in six.iteritems(new_object_params):
         new_object_params[name] = clone(param, safe=False)
     new_object = klass(**new_object_params)
     params_set = new_object.get_params(deep=False)
@@ -120,7 +121,7 @@ def _pprint(params, offset=0, printer=repr):
     params_list = list()
     this_line_length = offset
     line_sep = ',\n' + (1 + offset // 2) * ' '
-    for i, (k, v) in enumerate(sorted(params.iteritems())):
+    for i, (k, v) in enumerate(sorted(six.iteritems(params))):
         if type(v) is float:
             # use str for representing floating point numbers
             # this way we get consistent representation across
@@ -225,7 +226,7 @@ def set_params(self, **params):
             # Simple optimisation to gain speed (inspect is slow)
             return self
         valid_params = self.get_params(deep=True)
-        for key, value in params.iteritems():
+        for key, value in six.iteritems(params):
             split = key.split('__', 1)
             if len(split) > 1:
                 # nested objects case
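Reviewer's note: these replacements are mechanical, since `d.iteritems()` no longer exists on Python 3. A small illustration of the helper (behavior as documented by six, not part of this diff). Note that `clone` assigns back into the dict it is iterating; that is safe because only values change, never the key set:

from sklearn.externals import six

params = {'alpha': 0.1, 'fit_intercept': True}
# six.iteritems(d) calls d.iteritems() on Python 2 and d.items() on Python 3,
# so no intermediate list is built on either version.
for name, value in six.iteritems(params):
    print('%s=%r' % (name, value))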

sklearn/cluster/affinity_propagation_.py

Lines changed: 2 additions & 2 deletions

@@ -139,11 +139,11 @@ def affinity_propagation(S, preference=None, convergence_iter=15, max_iter=200,
                            != n_samples)
         if (not unconverged and (K > 0)) or (it == max_iter):
             if verbose:
-                print "Converged after %d iterations." % it
+                print("Converged after %d iterations." % it)
             break
     else:
         if verbose:
-            print "Did not converge"
+            print("Did not converge")
 
     I = np.where(np.diag(A + R) > 0)[0]
     K = I.size  # Identify exemplars
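Reviewer's note: the parenthesized form parses on both major versions. On Python 2, `print("...")` is the print statement applied to a parenthesized expression, so single-argument calls behave identically without any import; multi-argument calls print a tuple on Python 2 unless the module opts in to the function form. A sketch (the commit does not add this import here):

from __future__ import print_function  # must precede all other statements

it = 10
print("Converged after %d iterations." % it)  # identical on Py2 and Py3 regardless
print("Converged after", it, "iterations.")   # needs the future import on Py2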

sklearn/cluster/hierarchical.py

Lines changed: 8 additions & 7 deletions

@@ -15,10 +15,11 @@
 from scipy.cluster import hierarchy
 
 from ..base import BaseEstimator, ClusterMixin
-from ..utils._csgraph import cs_graph_components
 from ..externals.joblib import Memory
+from ..externals import six
 from ..metrics import euclidean_distances
 from ..utils import array2d
+from ..utils._csgraph import cs_graph_components
 
 from . import _hierarchical
 from ._feature_agglomeration import AgglomerationTransform
@@ -144,9 +145,9 @@ def ward_tree(X, connectivity=None, n_components=None, copy=True,
     moments_2 = np.zeros((n_nodes, n_features))
     moments_2[:n_samples] = X
     inertia = np.empty(len(coord_row), dtype=np.float)
-    _hierarchical.compute_ward_dist(moments_1, moments_2, coord_row, coord_col,
-                                    inertia)
-    inertia = zip(inertia, coord_row, coord_col)
+    _hierarchical.compute_ward_dist(moments_1, moments_2,
+                                    coord_row, coord_col, inertia)
+    inertia = list(six.moves.zip(inertia, coord_row, coord_col))
     heapify(inertia)
 
     # prepare the main fields
@@ -158,7 +159,7 @@ def ward_tree(X, connectivity=None, n_components=None, copy=True,
     not_visited = np.empty(n_nodes, dtype=np.int8)
 
     # recursive merge loop
-    for k in xrange(n_samples, n_nodes):
+    for k in range(n_samples, n_nodes):
         # identify the merge
         while True:
             inert, i, j = heappop(inertia)
@@ -191,7 +192,7 @@ def ward_tree(X, connectivity=None, n_components=None, copy=True,
                                         coord_row, coord_col, ini)
         # List comprehension is faster than a for loop
         [heappush(inertia, (ini[idx], k, coord_col[idx]))
-            for idx in xrange(n_additions)]
+            for idx in range(n_additions)]
 
     # Separate leaves in children (empty lists up to now)
     n_leaves = n_samples
@@ -346,7 +347,7 @@ def fit(self, X):
         """
         memory = self.memory
         X = array2d(X)
-        if isinstance(memory, basestring):
+        if isinstance(memory, six.string_types):
             memory = Memory(cachedir=memory, verbose=0)
 
         if not self.connectivity is None:
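Reviewer's note: two details above. `six.moves.zip` is `itertools.izip` on Python 2 and the builtin `zip` on Python 3, lazy in both cases, hence the explicit `list(...)`: `heapify` needs a mutable sequence. And `six.string_types` stands in for the Python-2-only `basestring`. A sketch:

from heapq import heapify, heappop
from sklearn.externals import six

inertia = list(six.moves.zip([3.0, 1.0], [0, 1], [1, 2]))  # materialize the iterator
heapify(inertia)                   # a bare zip object would raise TypeError on Py3
assert heappop(inertia)[0] == 1.0  # smallest merge cost comes out first

assert isinstance('/tmp/cache', six.string_types)  # str on Py3, basestring on Py2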

sklearn/cluster/k_means_.py

Lines changed: 17 additions & 18 deletions

@@ -98,7 +98,7 @@ def _k_init(X, n_clusters, n_local_trials=None, random_state=None,
     current_pot = closest_dist_sq.sum()
 
     # Pick the remaining n_clusters-1 points
-    for c in xrange(1, n_clusters):
+    for c in range(1, n_clusters):
         # Choose center candidates by sampling with probability proportional
         # to the squared distance to the closest existing center
         rand_vals = random_state.random_sample(n_local_trials) * current_pot
@@ -112,7 +112,7 @@ def _k_init(X, n_clusters, n_local_trials=None, random_state=None,
         best_candidate = None
         best_pot = None
         best_dist_sq = None
-        for trial in xrange(n_local_trials):
+        for trial in range(n_local_trials):
             # Compute potential when including center candidate
             new_dist_sq = np.minimum(closest_dist_sq,
                                      distance_to_candidates[trial])
@@ -363,7 +363,7 @@ def _kmeans_single(X, n_clusters, max_iter=300, init='k-means++',
     centers = _init_centroids(X, n_clusters, init, random_state=random_state,
                               x_squared_norms=x_squared_norms)
     if verbose:
-        print 'Initialization complete'
+        print('Initialization complete')
 
     # Allocate memory to store the distances for each sample to its
     # closer center for reallocation in case of ties
@@ -386,7 +386,7 @@ def _kmeans_single(X, n_clusters, max_iter=300, init='k-means++',
         centers = _k_means._centers_dense(X, labels, n_clusters, distances)
 
         if verbose:
-            print 'Iteration %i, inertia %s' % (i, inertia)
+            print('Iteration %i, inertia %s' % (i, inertia))
 
         if best_inertia is None or inertia < best_inertia:
             best_labels = labels.copy()
@@ -395,7 +395,7 @@ def _kmeans_single(X, n_clusters, max_iter=300, init='k-means++',
 
         if np.sum((centers_old - centers) ** 2) < tol:
             if verbose:
-                print 'Converged to similar centers at iteration', i
+                print('Converged to similar centers at iteration', i)
             break
     return best_labels, best_inertia, best_centers
 
@@ -943,14 +943,14 @@ def _mini_batch_convergence(model, iteration_idx, n_iter, tol,
             'mean batch inertia: %f, ewa inertia: %f ' % (
                 iteration_idx + 1, n_iter, batch_inertia,
                 ewa_inertia))
-        print progress_msg
+        print(progress_msg)
 
     # Early stopping based on absolute tolerance on squared change of
     # centers postion (using EWA smoothing)
     if tol > 0.0 and ewa_diff < tol:
         if verbose:
-            print 'Converged (small centers change) at iteration %d/%d' % (
-                iteration_idx + 1, n_iter)
+            print('Converged (small centers change) at iteration %d/%d'
+                  % (iteration_idx + 1, n_iter))
         return True
 
     # Early stopping heuristic due to lack of improvement on smoothed inertia
@@ -965,9 +965,9 @@ def _mini_batch_convergence(model, iteration_idx, n_iter, tol,
     if (model.max_no_improvement is not None
             and no_improvement >= model.max_no_improvement):
         if verbose:
-            print ('Converged (lack of improvement in inertia)'
-                   ' at iteration %d/%d' % (
-                       iteration_idx + 1, n_iter))
+            print('Converged (lack of improvement in inertia)'
+                  ' at iteration %d/%d'
+                  % (iteration_idx + 1, n_iter))
         return True
 
     # update the convergence context to maintain state across sucessive calls:
@@ -1141,8 +1141,8 @@ def fit(self, X, y=None):
         best_inertia = None
         for init_idx in range(self.n_init):
             if self.verbose:
-                print "Init %d/%d with method: %s" % (
-                    init_idx + 1, self.n_init, self.init)
+                print("Init %d/%d with method: %s"
+                      % (init_idx + 1, self.n_init, self.init))
             counts = np.zeros(self.n_clusters, dtype=np.int32)
 
             # TODO: once the `k_means` function works with sparse input we
@@ -1167,8 +1167,8 @@ def fit(self, X, y=None):
             _, inertia = _labels_inertia(X_valid, x_squared_norms_valid,
                                          cluster_centers)
             if self.verbose:
-                print "Inertia for init %d/%d: %f" % (
-                    init_idx + 1, self.n_init, inertia)
+                print("Inertia for init %d/%d: %f"
+                      % (init_idx + 1, self.n_init, inertia))
             if best_inertia is None or inertia < best_inertia:
                 self.cluster_centers_ = cluster_centers
                 self.counts_ = counts
@@ -1179,8 +1179,7 @@ def fit(self, X, y=None):
 
         # Perform the iterative optimization until the final convergence
         # criterion
-        for iteration_idx in xrange(n_iter):
-
+        for iteration_idx in range(n_iter):
             # Sample a minibatch from the full dataset
             minibatch_indices = random_state.random_integers(
                 0, n_samples - 1, self.batch_size)
@@ -1210,7 +1209,7 @@ def fit(self, X, y=None):
 
         if self.compute_labels:
             if self.verbose:
-                print 'Computing label assignements and total inertia'
+                print('Computing label assignements and total inertia')
             self.labels_, self.inertia_ = _labels_inertia(
                 X, x_squared_norms, self.cluster_centers_)
 

sklearn/cluster/mean_shift_.py

Lines changed: 2 additions & 1 deletion

@@ -8,6 +8,7 @@
 from collections import defaultdict
 import numpy as np
 
+from ..externals import six
 from ..utils import extmath, check_random_state
 from ..base import BaseEstimator, ClusterMixin
 from ..neighbors import NearestNeighbors
@@ -193,7 +194,7 @@ def get_bin_seeds(X, bin_size, min_bin_freq=1):
         bin_sizes[tuple(binned_point)] += 1
 
     # Select only those bins as seeds which have enough members
-    bin_seeds = np.array([point for point, freq in bin_sizes.iteritems() if
+    bin_seeds = np.array([point for point, freq in six.iteritems(bin_sizes) if
                           freq >= min_bin_freq], dtype=np.float32)
     bin_seeds = bin_seeds * bin_size
     return bin_seeds

sklearn/cluster/tests/test_spectral.py

Lines changed: 2 additions & 1 deletion

@@ -1,6 +1,7 @@
 """Testing for Spectral Clustering methods"""
 
-from cPickle import dumps, loads
+from sklearn.externals.six.moves import cPickle
+dumps, loads = cPickle.dumps, cPickle.loads
 
 import numpy as np
 from scipy import sparse
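Reviewer's note: `six.moves.cPickle` resolves to `cPickle` on Python 2 and to `pickle` on Python 3, where the C accelerator is used automatically. A sketch of the round trip the tests rely on:

from sklearn.externals.six.moves import cPickle

blob = cPickle.dumps({'gamma': 1.0})
assert cPickle.loads(blob) == {'gamma': 1.0}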

sklearn/covariance/graph_lasso_.py

Lines changed: 8 additions & 7 deletions

@@ -22,6 +22,7 @@
 from ..linear_model import cd_fast
 from ..cross_validation import check_cv, cross_val_score
 from ..externals.joblib import Parallel, delayed
+import collections
 
 
 ###############################################################################
@@ -154,8 +155,8 @@ def graph_lasso(emp_cov, alpha, cov_init=None, mode='cd', tol=1e-4,
     else:
         errors = dict(invalid='raise')
     try:
-        for i in xrange(max_iter):
-            for idx in xrange(n_features):
+        for i in range(max_iter):
+            for idx in range(n_features):
                 sub_covariance = covariance_[indices != idx].T[indices != idx]
                 row = emp_cov[idx, indices != idx]
                 with np.errstate(**errors):
@@ -187,7 +188,7 @@ def graph_lasso(emp_cov, alpha, cov_init=None, mode='cd', tol=1e-4,
             d_gap = _dual_gap(emp_cov, precision_, alpha)
             cost = _objective(emp_cov, precision_, alpha)
             if verbose:
-                print (
+                print(
                     '[graph_lasso] Iteration % 3i, cost % 3.2e, dual gap %.3e'
                     % (i, cost, d_gap))
             if return_costs:
@@ -431,7 +432,7 @@ def fit(self, X, y=None):
             n_alphas = self.alphas
         inner_verbose = max(0, self.verbose - 1)
 
-        if operator.isSequenceType(n_alphas):
+        if isinstance(n_alphas, collections.Sequence):
             alphas = self.alphas
             n_refinements = 1
         else:
@@ -510,10 +511,10 @@ def fit(self, X, y=None):
                                      n_alphas + 2)
                 alphas = alphas[1:-1]
             if self.verbose and n_refinements > 1:
-                print '[GraphLassoCV] Done refinement % 2i out of %i: % 3is'\
-                        % (i + 1, n_refinements, time.time() - t0)
+                print('[GraphLassoCV] Done refinement % 2i out of %i: % 3is'
+                      % (i + 1, n_refinements, time.time() - t0))
 
-        path = zip(*path)
+        path = list(zip(*path))
         cv_scores = list(path[1])
         alphas = list(path[0])
         # Finally, compute the score with alpha = 0
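Reviewer's note: `operator.isSequenceType` was removed in Python 3; the portable spelling is an `isinstance` check against the `Sequence` ABC, which here distinguishes an explicit grid of alphas (a list) from an integer count. A sketch — noting that on Python 3.3+ the ABC canonically lives in `collections.abc`, and the bare `collections.Sequence` alias used above was dropped in Python 3.10:

try:
    from collections.abc import Sequence  # Python 3.3+
except ImportError:
    from collections import Sequence      # Python 2 fallback

assert isinstance([0.01, 0.1, 1.0], Sequence)  # explicit list of alphas
assert not isinstance(4, Sequence)             # an integer means "4 refinements"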

sklearn/covariance/robust_covariance.py

Lines changed: 1 addition & 1 deletion

@@ -144,7 +144,7 @@ def c_step(X, n_support, remaining_iterations=30, initial_estimates=None,
     # Check early stopping
     if remaining_iterations == 0:
         if verbose:
-            print 'Maximum number of iterations reached'
+            print('Maximum number of iterations reached')
         det = fast_logdet(covariance)
         results = location, covariance, det, support, dist

sklearn/cross_validation.py

Lines changed: 4 additions & 3 deletions

@@ -23,6 +23,7 @@
 from .utils.fixes import unique
 from .externals.joblib import Parallel, delayed
 from .metrics import SCORERS, Scorer
+import numbers
 
 __all__ = ['Bootstrap',
            'KFold',
@@ -93,7 +94,7 @@ def __init__(self, n, indices=True):
 
     def __iter__(self):
         n = self.n
-        for i in xrange(n):
+        for i in range(n):
             test_index = np.zeros(n, dtype=np.bool)
             test_index[i] = True
             train_index = np.logical_not(test_index)
@@ -282,7 +283,7 @@ def __iter__(self):
         n_folds = self.n_folds
         fold_size = n // n_folds
 
-        for i in xrange(n_folds):
+        for i in range(n_folds):
             test_index = np.zeros(n, dtype=np.bool)
             if i < n_folds - 1:
                 test_index[self.idxs[i * fold_size:(i + 1) * fold_size]] = True
@@ -377,7 +378,7 @@ def __iter__(self):
         n = y.size
        idx = np.argsort(y)
 
-        for i in xrange(n_folds):
+        for i in range(n_folds):
             test_index = np.zeros(n, dtype=np.bool)
             test_index[idx[i::n_folds]] = True
             train_index = np.logical_not(test_index)
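Reviewer's note: the new `numbers` import is not used in the hunks shown here; presumably it backs integer checks elsewhere in this file. The idiom it enables looks like this (a sketch; the helper name is hypothetical):

import numbers
import numpy as np

def _as_int(n_folds):  # hypothetical helper, not from the commit
    # numbers.Integral matches int, long (Py2) and numpy integer scalars alike
    if not isinstance(n_folds, numbers.Integral):
        raise ValueError('n_folds must be an integer, got %r' % (n_folds,))
    return int(n_folds)

assert _as_int(np.int32(3)) == 3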

sklearn/datasets/base.py

Lines changed: 2 additions & 2 deletions

@@ -398,12 +398,12 @@ def load_boston():
     data_file = csv.reader(open(join(module_path, 'data',
                                      'boston_house_prices.csv')))
     fdescr = open(join(module_path, 'descr', 'boston_house_prices.rst'))
-    temp = data_file.next()
+    temp = next(data_file)
     n_samples = int(temp[0])
     n_features = int(temp[1])
     data = np.empty((n_samples, n_features))
     target = np.empty((n_samples,))
-    temp = data_file.next()  # names of features
+    temp = next(data_file)  # names of features
     feature_names = np.array(temp)
 
     for i, d in enumerate(data_file):
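Reviewer's note: the builtin `next()` has existed since Python 2.6 and works on any iterator, while the `.next()` method is Python 2 only (renamed `__next__` on Python 3), so this is the portable spelling. A sketch mirroring the CSV header handling above (assumes Python 3 for the unicode stream):

import csv
import io

reader = csv.reader(io.StringIO(u'506,13\nCRIM,ZN\n0.006,18.0\n'))
temp = next(reader)                     # first row: sample and feature counts
n_samples, n_features = int(temp[0]), int(temp[1])
feature_names = next(reader)            # second row: column names
assert (n_samples, n_features) == (506, 13)
assert feature_names == ['CRIM', 'ZN']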
