jeremiedbb
diff --git a/‎.gitignore
Lines changed: 60 additions & 1 deletion b/‎.gitignore
Lines changed: 60 additions & 1 deletion
diff --git a/‎benchmarks/bench_rcv1_logreg_convergence.py
Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_rcv1_logreg_convergence.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_sparsify.py
Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_sparsify.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎build_tools/azure/install.cmd
Lines changed: 7 additions & 1 deletion b/‎build_tools/azure/install.cmd
Lines changed: 7 additions & 1 deletion
diff --git a/‎build_tools/azure/install.sh
Lines changed: 9 additions & 3 deletions b/‎build_tools/azure/install.sh
Lines changed: 9 additions & 3 deletions
diff --git a/‎build_tools/azure/posix-32.yml
Lines changed: 1 addition & 1 deletion b/‎build_tools/azure/posix-32.yml
Lines changed: 1 addition & 1 deletion
diff --git a/‎build_tools/azure/posix.yml
Lines changed: 1 addition & 1 deletion b/‎build_tools/azure/posix.yml
Lines changed: 1 addition & 1 deletion
diff --git a/‎build_tools/azure/windows.yml
Lines changed: 1 addition & 1 deletion b/‎build_tools/azure/windows.yml
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/developers/develop.rst
Lines changed: 1 addition & 1 deletion b/‎doc/developers/develop.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/modules/classes.rst
Lines changed: 1 addition & 1 deletion b/‎doc/modules/classes.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/modules/computing.rst
Lines changed: 1 addition & 1 deletion b/‎doc/modules/computing.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/modules/cross_validation.rst
Lines changed: 24 additions & 13 deletions b/‎doc/modules/cross_validation.rst
Lines changed: 24 additions & 13 deletions
diff --git a/‎doc/modules/decomposition.rst
Lines changed: 1 addition & 1 deletion b/‎doc/modules/decomposition.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/modules/density.rst
Lines changed: 1 addition & 1 deletion b/‎doc/modules/density.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/modules/neighbors.rst
Lines changed: 1 addition & 1 deletion b/‎doc/modules/neighbors.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/templates/index.html
Lines changed: 0 additions & 5 deletions b/‎doc/templates/index.html
Lines changed: 0 additions & 5 deletions
diff --git a/‎doc/themes/scikit-learn-modern/static/css/theme.css
Lines changed: 7 additions & 0 deletions b/‎doc/themes/scikit-learn-modern/static/css/theme.css
Lines changed: 7 additions & 0 deletions
diff --git a/‎doc/themes/scikit-learn/static/nature.css_t
Lines changed: 0 additions & 5 deletions b/‎doc/themes/scikit-learn/static/nature.css_t
Lines changed: 0 additions & 5 deletions
diff --git a/‎doc/whats_new/v0.21.rst
Lines changed: 1 addition & 1 deletion b/‎doc/whats_new/v0.21.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/whats_new/v0.22.rst
Lines changed: 5 additions & 2 deletions b/‎doc/whats_new/v0.22.rst
Lines changed: 5 additions & 2 deletions
diff --git a/‎examples/applications/plot_model_complexity_influence.py
Lines changed: 1 addition & 1 deletion b/‎examples/applications/plot_model_complexity_influence.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎examples/linear_model/plot_sgd_penalties.py
Lines changed: 2 additions & 2 deletions b/‎examples/linear_model/plot_sgd_penalties.py
Lines changed: 2 additions & 2 deletions
@@ -75,7 +75,7 @@ _configtest.o.d
 # files generated from a template
 sklearn/utils/_seq_dataset.pyx
 sklearn/utils/_seq_dataset.pxd
-sklearn/linear_model/sag_fast.pyx
+sklearn/linear_model/_sag_fast.pyx
 
 # deprecated paths
 # TODO: Remove in 0.24
@@ -129,3 +129,62 @@ sklearn/svm/bounds.py
 sklearn/svm/libsvm.py
 sklearn/svm/libsvm_sparse.py
 sklearn/svm/liblinear.py
+
+sklearn/linear_model/base.py
+sklearn/linear_model/bayes.py
+sklearn/linear_model/cd_fast.py
+sklearn/linear_model/coordinate_descent.py
+sklearn/linear_model/huber.py
+sklearn/linear_model/least_angle.py
+sklearn/linear_model/logistic.py
+sklearn/linear_model/omp.py
+sklearn/linear_model/passive_aggressive.py
+sklearn/linear_model/perceptron.py
+sklearn/linear_model/ransac.py
+sklearn/linear_model/ridge.py
+sklearn/linear_model/sag.py
+sklearn/linear_model/sag_fast.py
+sklearn/linear_model/sgd_fast.py
+sklearn/linear_model/stochastic_gradient.py
+sklearn/linear_model/theil_sen.py
+
+sklearn/metrics/cluster/bicluster.py
+sklearn/metrics/cluster/supervised.py
+sklearn/metrics/cluster/unsupervised.py
+sklearn/metrics/cluster/expected_mutual_info_fast.py
+
+sklearn/metrics/base.py
+sklearn/metrics/classification.py
+sklearn/metrics/regression.py
+sklearn/metrics/ranking.py
+sklearn/metrics/pairwise_fast.py
+sklearn/metrics/scorer.py
+
+sklearn/inspection/partial_dependence.py
+sklearn/inspection/permutation_importance.py
+
+sklearn/neighbors/ball_tree.py
+sklearn/neighbors/base.py
+sklearn/neighbors/classification.py
+sklearn/neighbors/dist_metrics.py
+sklearn/neighbors/graph.py
+sklearn/neighbors/kd_tree.py
+sklearn/neighbors/kde.py
+sklearn/neighbors/lof.py
+sklearn/neighbors/nca.py
+sklearn/neighbors/nearest_centroid.py
+sklearn/neighbors/quad_tree.py
+sklearn/neighbors/regression.py
+sklearn/neighbors/typedefs.py
+sklearn/neighbors/unsupervised.py
+
+sklearn/manifold/isomap.py
+sklearn/manifold/locally_linear.py
+sklearn/manifold/mds.py
+sklearn/manifold/spectral_embedding_.py
+sklearn/manifold/t_sne.py
+
+sklearn/semi_supervised/label_propagation.py
+
+sklearn/preprocessing/data.py
+sklearn/preprocessing/label.py
@@ -11,7 +11,7 @@
 
 from sklearn.linear_model import (LogisticRegression, SGDClassifier)
 from sklearn.datasets import fetch_rcv1
-from sklearn.linear_model.sag import get_auto_step_size
+from sklearn.linear_model._sag import get_auto_step_size
 
 try:
     import lightning.classification as lightning_clf
 
@@ -45,7 +45,7 @@
 
 from scipy.sparse.csr import csr_matrix
 import numpy as np
-from sklearn.linear_model.stochastic_gradient import SGDRegressor
+from sklearn.linear_model import SGDRegressor
 from sklearn.metrics import r2_score
 
 np.random.seed(42)
 
@@ -11,9 +11,15 @@ IF "%PYTHON_ARCH%"=="64" (
     call deactivate
     @rem Clean up any left-over from a previous build
     conda remove --all -q -y -n %VIRTUALENV%
-    conda create -n %VIRTUALENV% -q -y python=%PYTHON_VERSION% numpy scipy cython matplotlib pytest=%PYTEST_VERSION% wheel pillow joblib
+    conda create -n %VIRTUALENV% -q -y python=%PYTHON_VERSION% numpy scipy cython matplotlib wheel pillow joblib
 
     call activate %VIRTUALENV%
+
+    IF "%PYTEST_VERSION%"=="*" (
+        pip install pytest
+    ) else (
+        pip install pytest==%PYTEST_VERSION%
+    )
     pip install pytest-xdist
 ) else (
     pip install numpy scipy cython pytest wheel pillow joblib
 
@@ -20,8 +20,8 @@ version_ge() {
 
 if [[ "$DISTRIB" == "conda" ]]; then
 
-    TO_INSTALL="python=$PYTHON_VERSION pip pytest=$PYTEST_VERSION \
-                pytest-cov numpy=$NUMPY_VERSION scipy=$SCIPY_VERSION \
+    TO_INSTALL="python=$PYTHON_VERSION pip \
+                numpy=$NUMPY_VERSION scipy=$SCIPY_VERSION \
                 cython=$CYTHON_VERSION joblib=$JOBLIB_VERSION"
 
     if [[ "$INSTALL_MKL" == "true" ]]; then
@@ -60,6 +60,12 @@ if [[ "$DISTRIB" == "conda" ]]; then
         conda config --set restore_free_channel true
     fi
 
+    if [[ "$PYTEST_VERSION" == "*" ]]; then
+        pip install pytest
+    else
+        pip install pytest=="$PYTEST_VERSION"
+    fi
+
 	make_conda $TO_INSTALL
     if [[ "$PYTHON_VERSION" == "*" ]]; then
         pip install pytest-xdist
@@ -88,7 +94,7 @@ elif [[ "$DISTRIB" == "conda-pip-latest" ]]; then
 fi
 
 if [[ "$COVERAGE" == "true" ]]; then
-    python -m pip install coverage codecov
+    python -m pip install coverage codecov pytest-cov
 fi
 
 if [[ "$TEST_DOCSTRINGS" == "true" ]]; then
 
@@ -11,7 +11,7 @@ jobs:
     TEST_DIR: '$(Agent.WorkFolder)/tmp_folder'
     JUNITXML: 'test-data.xml'
     OMP_NUM_THREADS: '4'
-    PYTEST_VERSION: '3.8.1'
+    PYTEST_VERSION: '5.2.1'
     OPENBLAS_NUM_THREADS: '4'
     SKLEARN_SKIP_NETWORK_TESTS: '1'
   strategy:
 
@@ -11,7 +11,7 @@ jobs:
     TEST_DIR: '$(Agent.WorkFolder)/tmp_folder'
     VIRTUALENV: 'testvenv'
     JUNITXML: 'test-data.xml'
-    PYTEST_VERSION: '3.8.1'
+    PYTEST_VERSION: '5.2.1'
     OMP_NUM_THREADS: '4'
     OPENBLAS_NUM_THREADS: '4'
     SKLEARN_SKIP_NETWORK_TESTS: '1'
 
@@ -12,7 +12,7 @@ jobs:
     VIRTUALENV: 'testvenv'
     JUNITXML: 'test-data.xml'
     SKLEARN_SKIP_NETWORK_TESTS: '1'
-    PYTEST_VERSION: '3.8.1'
+    PYTEST_VERSION: '5.2.1'
     TMP_FOLDER: '$(Agent.WorkFolder)\tmp_folder'
   strategy:
     matrix:
 
@@ -453,7 +453,7 @@ this can be achieved with::
         return self.classes_[np.argmax(D, axis=1)]
 
 In linear models, coefficients are stored in an array called ``coef_``, and the
-independent term is stored in ``intercept_``.  ``sklearn.linear_model.base``
+independent term is stored in ``intercept_``.  ``sklearn.linear_model._base``
 contains a few base classes and mixins that implement common linear model
 patterns.
 
 
@@ -882,7 +882,7 @@ Miscellaneous
     manifold.locally_linear_embedding
     manifold.smacof
     manifold.spectral_embedding
-    manifold.t_sne.trustworthiness
+    manifold.trustworthiness
 
 
 .. _metrics_ref:
 
@@ -297,7 +297,7 @@ decision function that is applied at prediction time is the same (a dot product)
 , so latency should be equivalent.
 
 Here is an example using
-:class:`sklearn.linear_model.stochastic_gradient.SGDClassifier` with the
+:class:`sklearn.linear_model.SGDClassifier` with the
 ``elasticnet`` penalty. The regularization strength is globally controlled by
 the ``alpha`` parameter. With a sufficiently high ``alpha``,
 one can then increase the ``l1_ratio`` parameter of ``elasticnet`` to
 
@@ -241,7 +241,7 @@ predefined scorer names::
 
 Or as a dict mapping scorer name to a predefined or custom scoring function::
 
-    >>> from sklearn.metrics.scorer import make_scorer
+    >>> from sklearn.metrics import make_scorer
     >>> scoring = {'prec_macro': 'precision_macro',
     ...            'rec_macro': make_scorer(recall_score, average='macro')}
     >>> scores = cross_validate(clf, X, y, scoring=scoring,
@@ -534,19 +534,30 @@ Stratified k-fold
 folds: each set contains approximately the same percentage of samples of each
 target class as the complete set.
 
-Example of stratified 3-fold cross-validation on a dataset with 10 samples from
-two slightly unbalanced classes::
+Here is an example of stratified 3-fold cross-validation on a dataset with 50
+samples from two unbalanced classes. We show the number of samples in each
+class and compare with :class:`KFold`.
 
-  >>> from sklearn.model_selection import StratifiedKFold
-
-  >>> X = np.ones(10)
-  >>> y = [0, 0, 0, 0, 1, 1, 1, 1, 1, 1]
-  >>> skf = StratifiedKFold(n_splits=3)
-  >>> for train, test in skf.split(X, y):
-  ...     print("%s %s" % (train, test))
-  [2 3 6 7 8 9] [0 1 4 5]
-  [0 1 3 4 5 8 9] [2 6 7]
-  [0 1 2 4 5 6 7] [3 8 9]
+  >>> from sklearn.model_selection import StratifiedKFold, KFold
+  >>> import numpy as np
+  >>> X, y = np.ones((50, 1)), np.hstack(([0] * 45, [1] * 5))
+  >>> skf = StratifiedKFold(n_splits=3) 
+  >>> for train, test in skf.split(X, y):  
+  ...     print('train -  {}   |   test -  {}'.format(
+  ...         np.bincount(y[train]), np.bincount(y[test])))
+  train -  [30  3]   |   test -  [15  2]
+  train -  [30  3]   |   test -  [15  2]
+  train -  [30  4]   |   test -  [15  1]
+  >>> kf = KFold(n_splits=3)
+  >>> for train, test in kf.split(X, y):
+  ...     print('train -  {}   |   test -  {}'.format(
+  ...         np.bincount(y[train]), np.bincount(y[test])))
+  train -  [28  5]   |   test -  [17]
+  train -  [28  5]   |   test -  [17]
+  train -  [34]   |   test -  [11  5]
+
+We can see that :class:`StratifiedKFold` preserves the class ratios
+(approximately 1 / 10) in both the train and test datasets.
 
 Here is a visualization of the cross-validation behavior.
 
 
@@ -24,7 +24,7 @@ that learns :math:`n` components in its ``fit`` method, and can be used on new
 data to project it on these components.
 
 PCA centers but does not scale the input data for each feature before
-applying the SVD. The optional parameter parameter ``whiten=True`` makes it
+applying the SVD. The optional parameter ``whiten=True`` makes it
 possible to project the data onto the singular space while scaling each
 component to unit variance. This is often useful if the models down-stream make
 strong assumptions on the isotropy of the signal: this is for example the case
 
@@ -78,7 +78,7 @@ It's clear how the kernel shape affects the smoothness of the resulting
 distribution.  The scikit-learn kernel density estimator can be used as
 follows:
 
-   >>> from sklearn.neighbors.kde import KernelDensity
+   >>> from sklearn.neighbors import KernelDensity
    >>> import numpy as np
    >>> X = np.array([[-1, -1], [-2, -1], [-3, -2], [1, 1], [2, 1], [3, 2]])
    >>> kde = KernelDensity(kernel='gaussian', bandwidth=0.2).fit(X)
 
@@ -469,7 +469,7 @@ and Quadratic Discriminant Analysis (:class:`sklearn.discriminant_analysis.Quadr
 for more complex methods that do not make this assumption. Usage of the default
 :class:`NearestCentroid` is simple:
 
-    >>> from sklearn.neighbors.nearest_centroid import NearestCentroid
+    >>> from sklearn.neighbors import NearestCentroid
     >>> import numpy as np
     >>> X = np.array([[-1, -1], [-2, -1], [-3, -2], [1, 1], [2, 1], [3, 2]])
     >>> y = np.array([1, 1, 1, 2, 2, 2])
 
@@ -182,11 +182,6 @@ <h4 class="sk-landing-call-header">Community</h4>
         <li><strong>Gitter:</strong> <a href="https://gitter.im/scikit-learn/scikit-learn">gitter.im/scikit-learn</a></li>
         </ul>
 
-        <form target="_top" id="paypal-form" method="post" action="https://www.paypal.com/cgi-bin/webscr">
-            <input type="hidden" value="_s-xclick" name="cmd">
-            <input type="hidden" value="74EYUMF3FTSW8" name="hosted_button_id">
-        </form>
-        <a class="btn btn-warning btn-big sk-donate-btn mb-1" onclick="document.getElementById('paypal-form').submit(); ">Help us, <strong>donate!</strong></a>
         <a class="btn btn-warning btn-big mb-1" href="about.html#citing-scikit-learn"><strong>Cite us!</strong></a>
       </div>
       <div class="col-md-4">
 
@@ -491,6 +491,13 @@ div.sk-navbar-collapse {
   text-align: center;
 }
 
+dl.citation > dd > ol > li {
+  display: inline;
+}
+
+dl.citation > dd > ol {
+  margin-bottom: 0;
+}
 
 /* docs index */
 
 
@@ -967,11 +967,6 @@ div.container.index-lower ul li em {
     font-weight: bold;
 }
 
-#paypal-form {
-    margin: 30px 0;
-    padding: 0;
-}
-
 div.container.index-lower a.cite-us {
     margin-left: 60px;
     padding-right: 20px;
 
@@ -228,7 +228,7 @@ random sampling procedures.
 - :func:`svm.SVC.decision_function` and
   :func:`multiclass.OneVsOneClassifier.decision_function`. |Fix|
 - :class:`linear_model.SGDClassifier` and any derived classifiers. |Fix|
-- Any model using the :func:`linear_model.sag.sag_solver` function with a `0`
+- Any model using the :func:`linear_model._sag.sag_solver` function with a `0`
   seed, including :class:`linear_model.LogisticRegression`,
   :class:`linear_model.LogisticRegressionCV`, :class:`linear_model.Ridge`,
   and :class:`linear_model.RidgeCV` with 'sag' solver. |Fix|
 
@@ -460,6 +460,10 @@ Changelog
   :func:`metrics.pairwise.manhattan_distances` in the case of sparse matrices.
   :pr:`15049` by `Paolo Toccaceli <ptocca>`.
 
+- |Enhancement| :func:`metrics.median_absolute_error` now supports the
+  ``multioutput`` parameter.
+  :pr:`14732` by :user:`Agamemnon Krasoulis <agamemnonc>`.
+
 :mod:`sklearn.model_selection`
 ..............................
 
@@ -663,7 +667,7 @@ Changelog
 - |Fix| :func:`utils.check_array` will now correctly detect numeric dtypes in
   pandas dataframes, fixing a bug where ``float32`` was upcast to ``float64``
   unnecessarily. :pr:`15094` by `Andreas Müller`_.
-  
+
 - |API| The following utils have been deprecated and are now private:
   - ``choose_check_classifiers_labels``
   - ``enforce_estimator_tags_y``
@@ -719,4 +723,3 @@ These changes mostly affect library developers.
   :pr:`13392` by :user:`Rok Mihevc <rok>`.
 
 - |Fix| Added ``check_transformer_data_not_an_array`` to checks where missing
-
 
@@ -31,7 +31,7 @@
 from sklearn.metrics import mean_squared_error
 from sklearn.svm import NuSVR
 from sklearn.ensemble import GradientBoostingRegressor
-from sklearn.linear_model.stochastic_gradient import SGDClassifier
+from sklearn.linear_model import SGDClassifier
 from sklearn.metrics import hamming_loss
 
 # #############################################################################
 
@@ -6,8 +6,8 @@
 Contours of where the penalty is equal to 1
 for the three penalties L1, L2 and elastic-net.
 
-All of the above are supported by
-:class:`sklearn.linear_model.stochastic_gradient`.
+All of the above are supported by :class:`~sklearn.linear_model.SGDClassifier`
+and :class:`~sklearn.linear_model.SGDRegressor`.
 
 """
 print(__doc__)