FIX compute precision-recall at 100% recall (#23214) · scikit-learn/scikit-learn@a176436 · GitHub

Commit a176436

stephanecollot, glemaitre, and jeremiedbb committed

FIX compute precision-recall at 100% recall (#23214)

Co-authored-by: Guillaume Lemaitre <g.lemaitre58@gmail.com>
Co-authored-by: jeremiedbb <jeremiedbb@yahoo.fr>

1 parent 6c07092 commit a176436
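Before this change, precision_recall_curve stopped its output at the first point where full recall was attained, so the point for a classifier that always predicts the positive class (recall=1.0, precision equal to the positive-class rate) could be missing from the curve. A minimal sketch of the fixed behaviour, using the toy data from the docstring below (assumes scikit-learn >= 1.1.1):

    import numpy as np
    from sklearn.metrics import precision_recall_curve

    y_true = np.array([0, 0, 1, 1])
    y_scores = np.array([0.1, 0.4, 0.35, 0.8])

    precision, recall, thresholds = precision_recall_curve(y_true, y_scores)

    # The curve now begins at the point for the always-positive classifier:
    # recall = 1.0, precision = class balance = y_true.mean() = 0.5.
    print(precision)   # [0.5        0.66666667 0.5        1.         1.        ]
    print(recall)      # [1.  1.  0.5 0.5 0. ]
    print(thresholds)  # [0.1  0.35 0.4  0.8 ]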

File tree

4 files changed (+44 lines, -18 lines)

doc/modules/model_evaluation.rst

Lines changed: 3 additions & 3 deletions
@@ -904,11 +904,11 @@ Here are some small examples in binary classification::
     >>> y_scores = np.array([0.1, 0.4, 0.35, 0.8])
     >>> precision, recall, threshold = precision_recall_curve(y_true, y_scores)
     >>> precision
-    array([0.66..., 0.5 , 1. , 1. ])
+    array([0.5 , 0.66..., 0.5 , 1. , 1. ])
     >>> recall
-    array([1. , 0.5, 0.5, 0. ])
+    array([1. , 1. , 0.5, 0.5, 0. ])
     >>> threshold
-    array([0.35, 0.4 , 0.8 ])
+    array([0.1 , 0.35, 0.4 , 0.8 ])
     >>> average_precision_score(y_true, y_scores)
     0.83...
 
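Note that the doctest for average_precision_score keeps its value of 0.83...: the prepended point shares recall=1.0 with its neighbour, so under AP's sum of precisions weighted by recall increments it contributes zero. A quick hand check with the arrays above (the textbook formula, not sklearn's internal code):

    import numpy as np

    precision = np.array([0.5, 2 / 3, 0.5, 1.0, 1.0])
    recall = np.array([1.0, 1.0, 0.5, 0.5, 0.0])

    # AP = sum over n of (R_n - R_{n-1}) * P_n; recall is returned in
    # decreasing order, so negating the diffs recovers the increments.
    ap = -np.sum(np.diff(recall) * precision[:-1])
    print(ap)  # 0.8333... -- the duplicated recall=1.0 step adds nothing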

doc/whats_new/v1.1.rst

Lines changed: 19 additions & 0 deletions
@@ -2,6 +2,25 @@
 
 .. currentmodule:: sklearn
 
+.. _changes_1_1_1:
+
+Version 1.1.1
+=============
+
+**In Development**
+
+Changelog
+---------
+
+:mod:`sklearn.metrics`
+......................
+
+- |Fix| Fixes `metrics.precision_recall_curve` to compute precision-recall at 100%
+  recall. The Precision-Recall curve now displays the last point corresponding to a
+  classifier that always predicts the positive class: recall=100% and
+  precision=class balance.
+  :pr:`23214` by :user:`Stéphane Collot <stephanecollot>` and :user:`Max Baak <mbaak>`.
+
 .. _changes_1_1:
 
 Version 1.1.0

sklearn/metrics/_ranking.py

Lines changed: 9 additions & 8 deletions
@@ -801,6 +801,9 @@ def precision_recall_curve(y_true, probas_pred, *, pos_label=None, sample_weight
     have a corresponding threshold. This ensures that the graph starts on the
     y axis.
 
+    The first precision and recall values are precision=class balance and recall=1.0
+    which corresponds to a classifier that always predicts the positive class.
+
     Read more in the :ref:`User Guide <precision_recall_f_measure_metrics>`.
 
     Parameters
@@ -834,7 +837,7 @@ def precision_recall_curve(y_true, probas_pred, *, pos_label=None, sample_weight
 
     thresholds : ndarray of shape (n_thresholds,)
         Increasing thresholds on the decision function used to compute
-        precision and recall. n_thresholds <= len(np.unique(probas_pred)).
+        precision and recall where `n_thresholds = len(np.unique(probas_pred))`.
 
     See Also
     --------
@@ -855,11 +858,11 @@ def precision_recall_curve(y_true, probas_pred, *, pos_label=None, sample_weight
     >>> precision, recall, thresholds = precision_recall_curve(
     ...     y_true, y_scores)
     >>> precision
-    array([0.66666667, 0.5 , 1. , 1. ])
+    array([0.5 , 0.66666667, 0.5 , 1. , 1. ])
     >>> recall
-    array([1. , 0.5, 0.5, 0. ])
+    array([1. , 1. , 0.5, 0.5, 0. ])
     >>> thresholds
-    array([0.35, 0.4 , 0.8 ])
+    array([0.1 , 0.35, 0.4 , 0.8 ])
     """
     fps, tps, thresholds = _binary_clf_curve(
         y_true, probas_pred, pos_label=pos_label, sample_weight=sample_weight
@@ -879,10 +882,8 @@ def precision_recall_curve(y_true, probas_pred, *, pos_label=None, sample_weight
     else:
         recall = tps / tps[-1]
 
-    # stop when full recall attained
-    # and reverse the outputs so recall is decreasing
-    last_ind = tps.searchsorted(tps[-1])
-    sl = slice(last_ind, None, -1)
+    # reverse the outputs so recall is decreasing
+    sl = slice(None, None, -1)
     return np.hstack((precision[sl], 1)), np.hstack((recall[sl], 0)), thresholds[sl]
 
 
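The behavioural change is confined to the slice: the old code cut the arrays at tps.searchsorted(tps[-1]), the first index reaching full recall, dropping every lower-threshold point beyond it before the reversal; the new code keeps all points. A standalone sketch of the two slicings on hand-written cumulative counts shaped like _binary_clf_curve output (these tps/fps values correspond to the docstring example):

    import numpy as np

    # Cumulative true/false positives at decreasing thresholds [0.8, 0.4, 0.35, 0.1]
    tps = np.array([1, 1, 2, 2])  # full recall (tps == tps[-1]) first reached at index 2
    fps = np.array([0, 1, 1, 2])

    precision = tps / (tps + fps)
    recall = tps / tps[-1]

    # Old: truncate at the first full-recall index, then reverse.
    old = slice(tps.searchsorted(tps[-1]), None, -1)
    print(recall[old])     # [1.  0.5 0.5] -- the lowest-threshold point is lost

    # New: reverse everything so recall is decreasing.
    new = slice(None, None, -1)
    print(recall[new])     # [1.  1.  0.5 0.5]
    print(precision[new])  # [0.5        0.66666667 0.5        1.        ]
    # precision_recall_curve then appends the (precision=1, recall=0) endpoint.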

sklearn/metrics/tests/test_ranking.py

Lines changed: 13 additions & 7 deletions
@@ -831,6 +831,12 @@ def test_precision_recall_curve():
     y_true, _, y_score = make_prediction(binary=True)
     _test_precision_recall_curve(y_true, y_score)
 
+    # Make sure the first point of the Precision-Recall curve on the right is
+    # (r=1.0, p=class balance) on a non-balanced dataset [1:]
+    p, r, t = precision_recall_curve(y_true[1:], y_score[1:])
+    assert r[0] == 1.0
+    assert p[0] == y_true[1:].mean()
+
     # Use {-1, 1} for labels; make sure original labels aren't modified
     y_true[np.where(y_true == 0)] = -1
     y_true_copy = y_true.copy()
@@ -848,7 +854,7 @@ def test_precision_recall_curve():
 
 
 def _test_precision_recall_curve(y_true, y_score):
-    # Test Precision-Recall and aread under PR curve
+    # Test Precision-Recall and area under PR curve
     p, r, thresholds = precision_recall_curve(y_true, y_score)
     precision_recall_auc = _average_precision_slow(y_true, y_score)
     assert_array_almost_equal(precision_recall_auc, 0.859, 3)
@@ -874,8 +880,8 @@ def test_precision_recall_curve_toydata():
     y_score = [0, 1]
     p, r, _ = precision_recall_curve(y_true, y_score)
     auc_prc = average_precision_score(y_true, y_score)
-    assert_array_almost_equal(p, [1, 1])
-    assert_array_almost_equal(r, [1, 0])
+    assert_array_almost_equal(p, [0.5, 1, 1])
+    assert_array_almost_equal(r, [1, 1, 0])
     assert_almost_equal(auc_prc, 1.0)
 
     y_true = [0, 1]
@@ -901,8 +907,8 @@ def test_precision_recall_curve_toydata():
     y_score = [1, 0]
     p, r, _ = precision_recall_curve(y_true, y_score)
     auc_prc = average_precision_score(y_true, y_score)
-    assert_array_almost_equal(p, [1, 1])
-    assert_array_almost_equal(r, [1, 0])
+    assert_array_almost_equal(p, [0.5, 1, 1])
+    assert_array_almost_equal(r, [1, 1, 0])
     assert_almost_equal(auc_prc, 1.0)
 
     y_true = [1, 0]
@@ -919,8 +925,8 @@ def test_precision_recall_curve_toydata():
     p, r, _ = precision_recall_curve(y_true, y_score)
     with pytest.warns(UserWarning, match="No positive class found in y_true"):
         auc_prc = average_precision_score(y_true, y_score)
-    assert_allclose(p, [0, 1])
-    assert_allclose(r, [1, 0])
+    assert_allclose(p, [0, 0, 1])
+    assert_allclose(r, [1, 1, 0])
     assert_allclose(auc_prc, 0)
 
     y_true = [1, 1]
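The toy cases above can be checked directly: on the separable pair the curve now carries three points, the extra one being the (recall=1, precision=0.5) endpoint for the 50/50 class balance. A short usage sketch (assumes scikit-learn >= 1.1.1; the imbalanced example mirrors the new assertions rather than copying them):

    import numpy as np
    from sklearn.metrics import precision_recall_curve

    # Perfectly ranked pair: one negative, one positive.
    p, r, _ = precision_recall_curve([0, 1], [0, 1])
    print(p)  # [0.5 1.  1. ]
    print(r)  # [1.  1.  0. ]

    # Imbalanced data: the first precision equals the positive-class rate.
    y_true = np.array([0, 0, 0, 1])
    y_score = np.array([0.1, 0.2, 0.3, 0.9])
    p, r, _ = precision_recall_curve(y_true, y_score)
    assert r[0] == 1.0
    assert p[0] == y_true.mean()  # 0.25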
