diff --git a/sklearn/model_selection/_validation.py b/sklearn/model_selection/_validation.py index dd204ad4a57d0..f7735a883ab79 100644 --- a/sklearn/model_selection/_validation.py +++ b/sklearn/model_selection/_validation.py @@ -965,9 +965,19 @@ def _check_is_permutation(indices, n_samples): def permutation_test_score(estimator, X, y, *, groups=None, cv=None, n_permutations=100, n_jobs=None, random_state=0, verbose=0, scoring=None): - """Evaluate the significance of a cross-validated score with permutations + """Evaluates the significance of a cross-validated score using permutations - Read more in the :ref:`User Guide <cross_validation>`. + Permutes targets to generate 'randomized data' and compute the empirical + p-value against the null hypothesis that features and targets are + independent. + + The p-value represents the fraction of randomized data sets where the + estimator performed as well or better than in the original data. A small + p-value suggests that there is a real dependency between features and + targets which has been used by the estimator to give good predictions. + A large p-value may be due to lack of real dependency between features + and targets or the estimator was not able to use the dependency to + give good predictions. Parameters ---------- @@ -1054,10 +1064,10 @@ def permutation_test_score(estimator, X, y, *, groups=None, cv=None, ----- This function implements Test 1 in: - Ojala and Garriga. Permutation Tests for Studying Classifier - Performance. The Journal of Machine Learning Research (2010) - vol. 11 - `[pdf] <http://www.jmlr.org/papers/volume11/ojala10a/ojala10a.pdf>`_. + Ojala and Garriga. `Permutation Tests for Studying Classifier + Performance + <http://www.jmlr.org/papers/volume11/ojala10a/ojala10a.pdf>`_. The + Journal of Machine Learning Research (2010) vol. 11 """ X, y, groups = indexable(X, y, groups)