scikit-learn
diff --git a/‎doc/modules/classes.rst
Lines changed: 1 addition & 0 deletions b/‎doc/modules/classes.rst
Lines changed: 1 addition & 0 deletions
diff --git a/‎doc/modules/clustering.rst
Lines changed: 29 additions & 24 deletions b/‎doc/modules/clustering.rst
Lines changed: 29 additions & 24 deletions
diff --git a/‎doc/sphinxext/gen_rst.py
Lines changed: 2 additions & 3 deletions b/‎doc/sphinxext/gen_rst.py
Lines changed: 2 additions & 3 deletions
diff --git a/‎sklearn/metrics/cluster/supervised.py
Lines changed: 11 additions & 9 deletions b/‎sklearn/metrics/cluster/supervised.py
Lines changed: 11 additions & 9 deletions
diff --git a/‎sklearn/metrics/cluster/unsupervised.py
Lines changed: 9 additions & 14 deletions b/‎sklearn/metrics/cluster/unsupervised.py
Lines changed: 9 additions & 14 deletions
@@ -868,6 +868,7 @@ details.
 
    metrics.adjusted_mutual_info_score
    metrics.adjusted_rand_score
+   metrics.calinski_harabaz_score
    metrics.completeness_score
    metrics.fowlkes_mallows_score
    metrics.homogeneity_completeness_v_measure
 
@@ -1344,18 +1344,20 @@ mean of homogeneity and completeness**:
 Fowlkes-Mallows scores
 ----------------------
 
-The Fowlkes-Mallows index (FMI) is defined as the geometric mean of
-the pairwise precision and recall::
+The Fowlkes-Mallows index (:func:`sklearn.metrics.fowlkes_mallows_score`) can be
+used when the ground truth class assignments of the samples are known. The
+Fowlkes-Mallows score FMI is defined as the geometric mean of the
+pairwise precision and recall:
 
-      FMI = TP / sqrt((TP + FP) * (TP + FN))
+.. math:: \text{FMI} = \frac{\text{TP}}{\sqrt{(\text{TP} + \text{FP}) (\text{TP} + \text{FN})}}
 
-Where :math:`TP` is the number of **True Positive** (i.e. the number of pair
-of points that belong to the same clusters in both labels_true and
-labels_pred), :math:`FP` is the number of **False Positive** (i.e. the number
-of pair of points that belong to the same clusters in labels_true and not
-in labels_pred) and :math:`FN`is the number of **False Negative** (i.e the
-number of pair of points that belongs in the same clusters in labels_pred
-and not in labels_True).
+Where ``TP`` is the number of **True Positives** (i.e. the number of pairs
+of points that belong to the same cluster in both the true labels and the
+predicted labels), ``FP`` is the number of **False Positives** (i.e. the number
+of pairs of points that belong to the same cluster in the true labels but not
+in the predicted labels) and ``FN`` is the number of **False Negatives** (i.e.
+the number of pairs of points that belong to the same cluster in the predicted
+labels but not in the true labels).
 
 The score ranges from 0 to 1. A high value indicates a good similarity
 between two clusterings.
@@ -1505,24 +1507,28 @@ Calinski-Harabaz Index
 ----------------------
 
 If the ground truth labels are not known, the Calinski-Harabaz index
-(:func:'sklearn.metrics.calinski_harabaz_score') can be used to evaluate the
+(:func:`sklearn.metrics.calinski_harabaz_score`) can be used to evaluate the
 model, where a higher Calinski-Harabaz score relates to a model with better
 defined clusters.
 
-For :math:`k` clusters, the Calinski-Harabaz :math:`ch` is given as the ratio
-of the between-clusters dispersion mean and the within-cluster dispersion:
+For :math:`k` clusters, the Calinski-Harabaz score :math:`s` is given as the
+ratio of the between-clusters dispersion mean and the within-cluster
+dispersion:
 
 .. math::
-  ch(k) = \frac{trace(B_k)}{trace(W_k)} \times \frac{N - k}{k - 1}
-  W_k  = \sum_{q=1}^k \sum_{x \in C_q} (x - c_q) (x - c_q)^T \\
-  B_k = \sum_q n_q (c_q - c) (c_q - c)^T \\
+  s(k) = \frac{\mathrm{Tr}(B_k)}{\mathrm{Tr}(W_k)} \times \frac{N - k}{k - 1}
 
-where:
-- :math:`N` be the number of points in our data,
-- :math:`C_q` be the set of points in cluster :math:`q`,
-- :math:`c_q` be the center of cluster :math:`q`,
-- :math:`c` be the center of :math:`E`,
-- :math:`n_q` be the number of points in cluster :math:`q`:
+where :math:`B_k` is the between-group dispersion matrix and :math:`W_k`
+is the within-cluster dispersion matrix defined by:
+
+.. math:: W_k = \sum_{q=1}^k \sum_{x \in C_q} (x - c_q) (x - c_q)^T
+
+.. math:: B_k = \sum_q n_q (c_q - c) (c_q - c)^T
+
+with :math:`N` the number of points in our data, :math:`C_q` the set of
+points in cluster :math:`q`, :math:`c_q` the center of cluster
+:math:`q`, :math:`c` the center of the whole data set :math:`E`, and
+:math:`n_q` the number of points in cluster :math:`q`.
 
 
   >>> from sklearn import metrics
@@ -1539,8 +1545,7 @@ cluster analysis.
   >>> from sklearn.cluster import KMeans
   >>> kmeans_model = KMeans(n_clusters=3, random_state=1).fit(X)
   >>> labels = kmeans_model.labels_
-  >>> metrics.calinski_harabaz_score(X, labels)
-  ...                                                      # doctest: +ELLIPSIS
+  >>> metrics.calinski_harabaz_score(X, labels)  # doctest: +ELLIPSIS
   560.39...
 
 
 
@@ -26,12 +26,11 @@
 # Try Python 2 first, otherwise load from Python 3
 try:
     from StringIO import StringIO
-    from BytesIO import BytesIO
     import cPickle as pickle
     import urllib2 as urllib
     from urllib2 import HTTPError, URLError
 except ImportError:
-    from io import StringIO, BytesIO
+    from io import StringIO
     import pickle
     import urllib.request
     import urllib.error
@@ -105,7 +104,7 @@ def _get_data(url):
         if encoding == 'plain':
             pass
         elif encoding == 'gzip':
-            data = BytesIO(data)
+            data = StringIO(data)
             data = gzip.GzipFile(fileobj=data).read()
         else:
             raise RuntimeError('unknown encoding')
 
@@ -824,23 +824,25 @@ def fowlkes_mallows_score(labels_true, labels_pred, max_n_classes=5000):
 
         FMI = TP / sqrt((TP + FP) * (TP + FN))
 
-    Where :math:`TP` is the number of `True Positive` (i.e. the number of pair
-    of points that belongs in the same clusters in both labels_true and
-    labels_pred), :math:`FP` is the number of `False Positive` (i.e. the number
-    of pair of points that belongs in the same clusters in labels_true and not
-    in labels_pred) and :math:`FN`is the number of `False Negative` (i.e the
-    number of pair of points that belongs in the same clusters in labels_pred
-    and not in labels_True).
+    Where ``TP`` is the number of **True Positives** (i.e. the number of pairs
+    of points that belong to the same cluster in both ``labels_true`` and
+    ``labels_pred``), ``FP`` is the number of **False Positives** (i.e. the
+    number of pairs of points that belong to the same cluster in
+    ``labels_true`` but not in ``labels_pred``) and ``FN`` is the number of
+    **False Negatives** (i.e. the number of pairs of points that belong to the
+    same cluster in ``labels_pred`` but not in ``labels_true``).
 
     The score ranges from 0 to 1. A high value indicates a good similarity
     between two clusterings.
 
+    Read more in the :ref:`User Guide <fowlkes_mallows_scores>`.
+
     Parameters
     ----------
-    labels_true : int array, shape = (n_samples,)
+    labels_true : int array, shape = (``n_samples``,)
         A clustering of the data into disjoint subsets.
 
-    labels_pred : array, shape = (n_samples, )
+    labels_pred : array, shape = (``n_samples``, )
         A clustering of the data into disjoint subsets.
 
     max_n_classes : int, optional (default=5000)
 
@@ -212,26 +212,21 @@ def calinski_harabaz_score(X, labels):
     """Compute the Calinski and Harabaz score.
 
     The score is defined as the ratio of the between-cluster dispersion to
-    the within-cluster dispersion. For :math:`K` cluster, the Calinski and
-    Harabaz score is defined as::
+    the within-cluster dispersion.
 
+    Read more in the :ref:`User Guide <calinski_harabaz_index>`.
 
-    With :math:`B_K` the between group dispersion matrix and :math:`W_K`
-    the within-cluster dispersion matrix defined by::
-    the number of samples in the cluster :math:`k` and the mean of the samples
-    in the cluster :math:`k` and the mean of all the samples.
-
-    Parameter
-    ---------
-    X : array-like, shape (n_samples, n_features)
-        List of n_features-dimensional data points. Each row corresponds
+    Parameters
+    ----------
+    X : array-like, shape (``n_samples``, ``n_features``)
+        List of ``n_features``-dimensional data points. Each row corresponds
         to a single data point.
 
-    labels : array-like, shape (n_samples,)
+    labels : array-like, shape (``n_samples``,)
         Predicted labels for each sample.
 
-    Return
-    ------
+    Returns
+    -------
     score : float
         The resulting Calinski-Harabaz score.