jayzed82
diff --git a/sklearn/cluster/_affinity_propagation.py b/sklearn/cluster/_affinity_propagation.py
Lines changed: 19 additions & 19 deletions
diff --git a/sklearn/cluster/_agglomerative.py b/sklearn/cluster/_agglomerative.py
Lines changed: 21 additions & 20 deletions
diff --git a/sklearn/cluster/_bicluster.py b/sklearn/cluster/_bicluster.py
Lines changed: 1 addition & 1 deletion
diff --git a/sklearn/cluster/_dbscan.py b/sklearn/cluster/_dbscan.py
Lines changed: 1 addition & 1 deletion
diff --git a/sklearn/cluster/_feature_agglomeration.py b/sklearn/cluster/_feature_agglomeration.py
Lines changed: 2 additions & 2 deletions
@@ -41,10 +41,10 @@ def affinity_propagation(S, *, preference=None, convergence_iter=15,
     Parameters
     ----------
 
-    S : array-like, shape (n_samples, n_samples)
+    S : array-like of shape (n_samples, n_samples)
         Matrix of similarities between points
 
-    preference : array-like, shape (n_samples,) or float, optional
+    preference : array-like of shape (n_samples,) or float, default=None
         Preferences for each point - points with larger values of
         preferences are more likely to be chosen as exemplars. The number of
         exemplars, i.e. of clusters, is influenced by the input preferences
@@ -53,27 +53,27 @@ def affinity_propagation(S, *, preference=None, convergence_iter=15,
         number of clusters). For a smaller amount of clusters, this can be set
         to the minimum value of the similarities.
 
-    convergence_iter : int, optional, default: 15
+    convergence_iter : int, default=15
         Number of iterations with no change in the number
         of estimated clusters that stops the convergence.
 
-    max_iter : int, optional, default: 200
+    max_iter : int, default=200
         Maximum number of iterations
 
-    damping : float, optional, default: 0.5
+    damping : float, default=0.5
         Damping factor between 0.5 and 1.
 
-    copy : boolean, optional, default: True
+    copy : bool, default=True
         If copy is False, the affinity matrix is modified inplace by the
         algorithm, for memory efficiency
 
-    verbose : boolean, optional, default: False
+    verbose : bool, default=False
         The verbosity level
 
-    return_n_iter : bool, default False
+    return_n_iter : bool, default=False
         Whether or not to return the number of iterations.
 
-    random_state : int or np.random.RandomStateInstance, default: 0
+    random_state : int or RandomState instance, default=0
         Pseudo-random number generator to control the starting state.
         Use an int for reproducible results across function calls.
         See the :term:`Glossary <random_state>`.
@@ -84,10 +84,10 @@ def affinity_propagation(S, *, preference=None, convergence_iter=15,
     Returns
     -------
 
-    cluster_centers_indices : array, shape (n_clusters,)
+    cluster_centers_indices : ndarray of shape (n_clusters,)
         index of clusters centers
 
-    labels : array, shape (n_samples,)
+    labels : ndarray of shape (n_samples,)
         cluster labels for each point
 
     n_iter : int
@@ -292,7 +292,7 @@ class AffinityPropagation(ClusterMixin, BaseEstimator):
     verbose : bool, default=False
         Whether to be verbose.
 
-    random_state : int or np.random.RandomStateInstance, default: 0
+    random_state : int or RandomState instance, default=0
         Pseudo-random number generator to control the starting state.
         Use an int for reproducible results across function calls.
         See the :term:`Glossary <random_state>`.
@@ -382,8 +382,8 @@ def fit(self, X, y=None):
 
         Parameters
         ----------
-        X : array-like or sparse matrix, shape (n_samples, n_features), or \
-            array-like, shape (n_samples, n_samples)
+        X : {array-like, sparse matrix} of shape (n_samples, n_features), or \
+                array-like of shape (n_samples, n_samples)
             Training instances to cluster, or similarities / affinities between
             instances if ``affinity='precomputed'``. If a sparse feature matrix
             is provided, it will be converted into a sparse ``csr_matrix``.
@@ -428,13 +428,13 @@ def predict(self, X):
 
         Parameters
         ----------
-        X : array-like or sparse matrix, shape (n_samples, n_features)
+        X : {array-like, sparse matrix} of shape (n_samples, n_features)
             New data to predict. If a sparse matrix is provided, it will be
             converted into a sparse ``csr_matrix``.
 
         Returns
         -------
-        labels : ndarray, shape (n_samples,)
+        labels : ndarray of shape (n_samples,)
             Cluster labels.
         """
         check_is_fitted(self)
@@ -457,8 +457,8 @@ def fit_predict(self, X, y=None):
 
         Parameters
         ----------
-        X : array-like or sparse matrix, shape (n_samples, n_features), or \
-            array-like, shape (n_samples, n_samples)
+        X : {array-like, sparse matrix} of shape (n_samples, n_features), or \
+                array-like of shape (n_samples, n_samples)
             Training instances to cluster, or similarities / affinities between
             instances if ``affinity='precomputed'``. If a sparse feature matrix
             is provided, it will be converted into a sparse ``csr_matrix``.
@@ -468,7 +468,7 @@ def fit_predict(self, X, y=None):
 
         Returns
         -------
-        labels : ndarray, shape (n_samples,)
+        labels : ndarray of shape (n_samples,)
             Cluster labels.
         """
         return super().fit_predict(X, y)
@@ -150,29 +150,29 @@ def ward_tree(X, *, connectivity=None, n_clusters=None, return_distance=False):
 
     Parameters
     ----------
-    X : array, shape (n_samples, n_features)
+    X : array-like of shape (n_samples, n_features)
         feature matrix representing n_samples samples to be clustered
 
-    connectivity : sparse matrix (optional).
+    connectivity : sparse matrix, default=None
         connectivity matrix. Defines for each sample the neighboring samples
         following a given structure of the data. The matrix is assumed to
         be symmetric and only the upper triangular half is used.
         Default is None, i.e, the Ward algorithm is unstructured.
 
-    n_clusters : int (optional)
+    n_clusters : int, default=None
         Stop early the construction of the tree at n_clusters. This is
         useful to decrease computation time if the number of clusters is
         not small compared to the number of samples. In this case, the
         complete tree is not computed, thus the 'children' output is of
         limited use, and the 'parents' output should rather be used.
         This option is valid only when specifying a connectivity matrix.
 
-    return_distance : bool (optional)
+    return_distance : bool, default=False
         If True, return the distance between the clusters.
 
     Returns
     -------
-    children : 2D array, shape (n_nodes-1, 2)
+    children : ndarray of shape (n_nodes-1, 2)
         The children of each non-leaf node. Values less than `n_samples`
         correspond to leaves of the tree which are the original samples.
         A node `i` greater than or equal to `n_samples` is a non-leaf
@@ -186,11 +186,11 @@ def ward_tree(X, *, connectivity=None, n_clusters=None, return_distance=False):
     n_leaves : int
         The number of leaves in the tree
 
-    parents : 1D array, shape (n_nodes, ) or None
+    parents : ndarray of shape (n_nodes,) or None
         The parent of each node. Only returned when a connectivity matrix
         is specified, elsewhere 'None' is returned.
 
-    distances : 1D array, shape (n_nodes-1, )
+    distances : ndarray of shape (n_nodes-1,)
         Only returned if return_distance is set to True (for compatibility).
         The distances between the centers of the nodes. `distances[i]`
         corresponds to a weighted euclidean distance between
@@ -356,24 +356,24 @@ def linkage_tree(X, connectivity=None, n_clusters=None, linkage='complete',
 
     Parameters
     ----------
-    X : array, shape (n_samples, n_features)
+    X : array-like of shape (n_samples, n_features)
         feature matrix representing n_samples samples to be clustered
 
-    connectivity : sparse matrix (optional).
+    connectivity : sparse matrix, default=None
         connectivity matrix. Defines for each sample the neighboring samples
         following a given structure of the data. The matrix is assumed to
         be symmetric and only the upper triangular half is used.
         Default is None, i.e, the Ward algorithm is unstructured.
 
-    n_clusters : int (optional)
+    n_clusters : int, default=None
         Stop early the construction of the tree at n_clusters. This is
         useful to decrease computation time if the number of clusters is
         not small compared to the number of samples. In this case, the
         complete tree is not computed, thus the 'children' output is of
         limited use, and the 'parents' output should rather be used.
         This option is valid only when specifying a connectivity matrix.
 
-    linkage : {"average", "complete", "single"}, optional, default: "complete"
+    linkage : {"average", "complete", "single"}, default="complete"
         Which linkage criteria to use. The linkage criterion determines which
         distance to use between sets of observation.
             - average uses the average of the distances of each observation of
@@ -383,16 +383,16 @@ def linkage_tree(X, connectivity=None, n_clusters=None, linkage='complete',
             - single uses the minimum of the distances between all observations
               of the two sets.
 
-    affinity : string or callable, optional, default: "euclidean".
+    affinity : str or callable, default="euclidean"
         which metric to use. Can be "euclidean", "manhattan", or any
         distance know to paired distance (see metric.pairwise)
 
-    return_distance : bool, default False
+    return_distance : bool, default=False
         whether or not to return the distances between the clusters.
 
     Returns
     -------
-    children : 2D array, shape (n_nodes-1, 2)
+    children : ndarray of shape (n_nodes-1, 2)
         The children of each non-leaf node. Values less than `n_samples`
         correspond to leaves of the tree which are the original samples.
         A node `i` greater than or equal to `n_samples` is a non-leaf
@@ -406,11 +406,11 @@ def linkage_tree(X, connectivity=None, n_clusters=None, linkage='complete',
     n_leaves : int
         The number of leaves in the tree.
 
-    parents : 1D array, shape (n_nodes, ) or None
+    parents : ndarray of shape (n_nodes,) or None
         The parent of each node. Only returned when a connectivity matrix
         is specified, elsewhere 'None' is returned.
 
-    distances : ndarray, shape (n_nodes-1,)
+    distances : ndarray of shape (n_nodes-1,)
         Returned when return_distance is set to True.
 
         distances[i] refers to the distance between children[i][0] and
@@ -636,7 +636,7 @@ def _hc_cut(n_clusters, children, n_leaves):
     n_clusters : int or ndarray
         The number of clusters to form.
 
-    children : 2D array, shape (n_nodes-1, 2)
+    children : ndarray of shape (n_nodes-1, 2)
         The children of each non-leaf node. Values less than `n_samples`
         correspond to leaves of the tree which are the original samples.
         A node `i` greater than or equal to `n_samples` is a non-leaf
@@ -910,7 +910,8 @@ def fit_predict(self, X, y=None):
 
         Parameters
         ----------
-        X : array-like, shape (n_samples, n_features) or (n_samples, n_samples)
+        X : array-like of shape (n_samples, n_features) or \
+                (n_samples, n_samples)
             Training instances to cluster, or distances between instances if
             ``affinity='precomputed'``.
 
@@ -919,7 +920,7 @@ def fit_predict(self, X, y=None):
 
         Returns
         -------
-        labels : ndarray, shape (n_samples,)
+        labels : ndarray of shape (n_samples,)
             Cluster labels.
         """
         return super().fit_predict(X, y)
@@ -957,7 +958,7 @@ class FeatureAgglomeration(AgglomerativeClustering, AgglomerationTransform):
         kneighbors_graph. Default is None, i.e, the
         hierarchical clustering algorithm is unstructured.
 
-    compute_full_tree : 'auto' or bool, optional, default='auto'
+    compute_full_tree : 'auto' or bool, default='auto'
         Stop early the construction of the tree at n_clusters. This is useful
         to decrease computation time if the number of clusters is not small
         compared to the number of features. This option is useful only when
 
@@ -111,7 +111,7 @@ def fit(self, X, y=None):
 
         Parameters
         ----------
-        X : array-like, shape (n_samples, n_features)
+        X : array-like of shape (n_samples, n_features)
 
         y : Ignored
 
 
@@ -46,7 +46,7 @@ def dbscan(X, eps=0.5, *, min_samples=5, metric='minkowski',
         The number of samples (or total weight) in a neighborhood for a point
         to be considered as a core point. This includes the point itself.
 
-    metric : string, or callable
+    metric : str or callable, default='minkowski'
         The metric to use when calculating distance between instances in a
         feature array. If metric is a string or callable, it must be one of
         the options allowed by :func:`sklearn.metrics.pairwise_distances` for
 
@@ -33,7 +33,7 @@ def transform(self, X):
 
         Returns
         -------
-        Y : array, shape = [n_samples, n_clusters] or [n_clusters]
+        Y : ndarray of shape (n_samples, n_clusters) or (n_clusters,)
             The pooled values for each feature cluster.
         """
         check_is_fitted(self)
@@ -67,7 +67,7 @@ def inverse_transform(self, Xred):
 
         Returns
         -------
-        X : array, shape=[n_samples, n_features] or [n_features]
+        X : ndarray of shape (n_samples, n_features) or (n_features,)
             A vector of size n_samples with the values of Xred assigned to
             each of the cluster of samples.
         """