ENH Adds PyTorch support for PCA · scikit-learn/scikit-learn@dd4c9fc · GitHub

Commit dd4c9fc
ENH Adds PyTorch support for PCA
1 parent 1882672

File tree: 4 files changed, +86 -21 lines changed

sklearn/decomposition/_pca.py

Lines changed: 26 additions & 12 deletions
@@ -14,7 +14,6 @@
 from numbers import Integral, Real
 
 import numpy as np
-from scipy import linalg
 from scipy.special import gammaln
 from scipy.sparse import issparse
 from scipy.sparse.linalg import svds
@@ -28,6 +27,7 @@
 from ..utils.validation import check_is_fitted
 from ..utils._param_validation import Interval, StrOptions
 from ..utils._param_validation import RealNotInt
+from ..utils._array_api import get_namespace, _is_torch_namespace
 
 
 def _assess_dimension(spectrum, rank, n_samples):
@@ -109,8 +109,10 @@ def _infer_dimension(spectrum, n_samples):
     The returned value will be in [1, n_features - 1].
     """
-    ll = np.empty_like(spectrum)
-    ll[0] = -np.inf  # we don't want to return n_components = 0
+    xp, _ = get_namespace(spectrum)
+
+    ll = xp.empty_like(spectrum)
+    ll[0] = -xp.inf  # we don't want to return n_components = 0
     for rank in range(1, spectrum.shape[0]):
         ll[rank] = _assess_dimension(spectrum, rank, n_samples)
     return ll.argmax()
@@ -380,6 +382,9 @@ class PCA(_BasePCA):
         "power_iteration_normalizer": [StrOptions({"auto", "QR", "LU", "none"})],
         "random_state": ["random_state"],
     }
+    _pca_torch_arpack_solver_error_message: str = (
+        "PCA with arpack solver does not support PyTorch tensors."
+    )
 
     def __init__(
         self,
@@ -474,6 +479,7 @@ def fit_transform(self, X, y=None):
 
     def _fit(self, X):
         """Dispatch to the right submethod depending on the chosen solver."""
+        xp, _ = get_namespace(X)
 
         # Raise an error for sparse input.
         # This is more informative than the generic one raised by check_array.
@@ -482,9 +488,13 @@ def _fit(self, X):
                 "PCA does not support sparse input. See "
                 "TruncatedSVD for a possible alternative."
             )
+        # Raise an error for torch input with the arpack or randomized solver.
+        # TODO: support the randomized solver for torch tensors.
+        if self.svd_solver in ["arpack", "randomized"] and _is_torch_namespace(xp):
+            raise TypeError(self._pca_torch_arpack_solver_error_message)
 
         X = self._validate_data(
-            X, dtype=[np.float64, np.float32], ensure_2d=True, copy=self.copy
+            X, dtype=[xp.float64, xp.float32], ensure_2d=True, copy=self.copy
        )
 
        # Handle n_components==None
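
The new guard above is the user-visible behavior change for the unsupported solvers. A minimal sketch of what a caller would see (assuming PyTorch and array-api-compat are installed; the input shape is illustrative):

    import torch
    from sklearn._config import config_context
    from sklearn.decomposition import PCA

    X = torch.rand(30, 4)
    with config_context(array_api_dispatch=True):
        # arpack and randomized are rejected for torch tensors for now,
        # so this raises the TypeError defined on the class above.
        PCA(n_components=2, svd_solver="arpack").fit(X)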
@@ -516,6 +526,8 @@ def _fit(self, X):
 
     def _fit_full(self, X, n_components):
         """Fit the model by computing full SVD on X."""
+        xp, _ = get_namespace(X)
+
         n_samples, n_features = X.shape
 
         if n_components == "mle":
@@ -531,10 +543,10 @@ def _fit_full(self, X, n_components):
             )
 
         # Center data
-        self.mean_ = np.mean(X, axis=0)
+        self.mean_ = xp.mean(X, axis=0)
         X -= self.mean_
 
-        U, S, Vt = linalg.svd(X, full_matrices=False)
+        U, S, Vt = xp.linalg.svd(X, full_matrices=False)
         # flip eigenvectors' sign to enforce deterministic output
         U, Vt = svd_flip(U, Vt)
 
@@ -544,7 +556,7 @@ def _fit_full(self, X, n_components):
         explained_variance_ = (S**2) / (n_samples - 1)
         total_var = explained_variance_.sum()
         explained_variance_ratio_ = explained_variance_ / total_var
-        singular_values_ = S.copy()  # Store the singular values.
+        singular_values_ = xp.asarray(S, copy=True)  # Store the singular values.
 
         # Postprocess the number of components required
         if n_components == "mle":
@@ -556,7 +568,7 @@ def _fit_full(self, X, n_components):
         # their variance is always greater than n_components float
         # passed. More discussion in issue: #15669
         ratio_cumsum = stable_cumsum(explained_variance_ratio_)
-        n_components = np.searchsorted(ratio_cumsum, n_components, side="right") + 1
+        n_components = xp.searchsorted(ratio_cumsum, n_components, side="right") + 1
         # Compute noise covariance using Probabilistic PCA model
         # The sigma2 maximum likelihood (cf. eq. 12.46)
         if n_components < min(n_features, n_samples):
@@ -577,6 +589,8 @@ def _fit_truncated(self, X, n_components, svd_solver):
         """Fit the model by computing truncated SVD (by ARPACK or randomized)
         on X.
         """
+        xp, _ = get_namespace(X)
+
         n_samples, n_features = X.shape
 
         if isinstance(n_components, str):
@@ -602,7 +616,7 @@ def _fit_truncated(self, X, n_components, svd_solver):
         random_state = check_random_state(self.random_state)
 
         # Center data
-        self.mean_ = np.mean(X, axis=0)
+        self.mean_ = xp.mean(X, axis=0)
         X -= self.mean_
 
         if svd_solver == "arpack":
@@ -636,12 +650,12 @@ def _fit_truncated(self, X, n_components, svd_solver):
         # Workaround in-place variance calculation since at the time numpy
         # did not have a way to calculate variance in-place.
         N = X.shape[0] - 1
-        np.square(X, out=X)
-        np.sum(X, axis=0, out=X[0])
+        xp.square(X, out=X)
+        xp.sum(X, axis=0, out=X[0])
         total_var = (X[0] / N).sum()
 
         self.explained_variance_ratio_ = self.explained_variance_ / total_var
-        self.singular_values_ = S.copy()  # Store the singular values.
+        self.singular_values_ = xp.asarray(S)  # Store the singular values.
 
         if self.n_components_ < min(n_features, n_samples):
             self.noise_variance_ = total_var - self.explained_variance_.sum()
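
Taken together, the changes to _fit, _fit_full, and the helpers let the full solver run end to end on torch tensors. A minimal usage sketch (assuming PyTorch and array-api-compat are installed; the random data is only illustrative):

    import torch
    from sklearn._config import config_context
    from sklearn.decomposition import PCA

    X = torch.rand(100, 5)
    with config_context(array_api_dispatch=True):
        pca = PCA(n_components=2, svd_solver="full")
        X_reduced = pca.fit_transform(X)
    # Per the accompanying test, the output stays a torch.Tensor.
    print(type(X_reduced), pca.explained_variance_ratio_)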

sklearn/decomposition/tests/test_pca.py

Lines changed: 43 additions & 1 deletion
@@ -5,9 +5,14 @@
 import pytest
 import warnings
 
-from sklearn.utils._testing import assert_allclose
+from sklearn.utils._testing import (
+    assert_allclose,
+    skip_if_array_api_compat_not_configured,
+)
 
 from sklearn import datasets
+from sklearn._config import config_context
+from sklearn.base import clone
 from sklearn.decomposition import PCA
 from sklearn.datasets import load_iris
 from sklearn.decomposition._pca import _assess_dimension
@@ -17,6 +22,43 @@
 PCA_SOLVERS = ["full", "arpack", "randomized", "auto"]
 
 
+@skip_if_array_api_compat_not_configured
+@pytest.mark.parametrize("device", ["cuda", "cpu"])
+@pytest.mark.parametrize("dtype", ["float32", "float64"])
+@pytest.mark.parametrize("svd_solver", PCA_SOLVERS)
+@pytest.mark.parametrize("n_components", range(1, iris.data.shape[1]))
+def test_pca_array_torch(device, dtype, svd_solver, n_components):
+    """Check that running on PyTorch tensors gives the same results as NumPy."""
+    torch = pytest.importorskip("torch")
+    if device == "cuda" and not torch.has_cuda:
+        pytest.skip("test requires cuda")
+
+    iris_data = iris.data.astype(dtype)
+    X_np = iris_data
+    X_torch = torch.asarray(iris_data, device=device)
+
+    pca_np = PCA(n_components=n_components, svd_solver=svd_solver)
+    pca_torch = clone(pca_np)
+
+    with config_context(array_api_dispatch=True):
+        if svd_solver in ["arpack", "randomized"]:
+            with pytest.raises(
+                TypeError, match=PCA._pca_torch_arpack_solver_error_message
+            ):
+                pca_torch.fit_transform(X_torch)
+        else:
+            X_transformed_torch = pca_torch.fit_transform(X_torch)
+            X_transformed_np = pca_np.fit_transform(X_np)
+
+            assert type(X_transformed_np) == np.ndarray, "Invalid type"
+            assert type(X_transformed_torch) == torch.Tensor, "Invalid type"
+            assert_allclose(X_transformed_np, X_transformed_torch, atol=1e-3)
+
+    # TODO: introduce PyTorch support for the methods below.
+    # cov = pca.get_covariance()
+    # precision = pca.get_precision()
+
+
 @pytest.mark.parametrize("svd_solver", PCA_SOLVERS)
 @pytest.mark.parametrize("n_components", range(1, iris.data.shape[1]))
 def test_pca(svd_solver, n_components):

sklearn/utils/_array_api.py

Lines changed: 5 additions & 0 deletions
@@ -72,6 +72,11 @@ def _is_numpy_namespace(xp):
     return xp.__name__ in {"numpy", "array_api_compat.numpy", "numpy.array_api"}
 
 
+def _is_torch_namespace(xp):
+    """Return True if xp is backed by PyTorch."""
+    return xp.__name__ in {"torch", "array_api_compat.torch"}
+
+
 def isdtype(dtype, kind, *, xp):
     """Returns a boolean indicating whether a provided dtype is of type "kind".
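
A quick sketch of how the two helpers resolve namespaces; this assumes torch and array-api-compat are installed and that get_namespace maps torch tensors to the array_api_compat.torch namespace when dispatch is enabled:

    import numpy as np
    import torch
    from sklearn._config import config_context
    from sklearn.utils._array_api import (
        get_namespace,
        _is_numpy_namespace,
        _is_torch_namespace,
    )

    with config_context(array_api_dispatch=True):
        xp, _ = get_namespace(torch.ones(3))
        print(_is_torch_namespace(xp))  # expected: True
        xp, _ = get_namespace(np.ones(3))
        print(_is_numpy_namespace(xp))  # expected: True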

sklearn/utils/extmath.py

Lines changed: 12 additions & 8 deletions
@@ -800,16 +800,18 @@ def svd_flip(u, v, u_based_decision=True):
     v_adjusted : ndarray
         Array v with adjusted rows and the same dimensions as v.
     """
+    xp, _ = get_namespace(u)
+
     if u_based_decision:
         # columns of u, rows of v
-        max_abs_cols = np.argmax(np.abs(u), axis=0)
-        signs = np.sign(u[max_abs_cols, range(u.shape[1])])
+        max_abs_cols = xp.argmax(xp.abs(u), axis=0)
+        signs = xp.sign(u[max_abs_cols, range(u.shape[1])])
         u *= signs
         v *= signs[:, np.newaxis]
     else:
         # rows of v, columns of u
-        max_abs_rows = np.argmax(np.abs(v), axis=1)
-        signs = np.sign(v[range(v.shape[0]), max_abs_rows])
+        max_abs_rows = xp.argmax(xp.abs(v), axis=1)
+        signs = xp.sign(v[range(v.shape[0]), max_abs_rows])
         u *= signs
         v *= signs[:, np.newaxis]
     return u, v
@@ -1139,10 +1141,12 @@ def stable_cumsum(arr, axis=None, rtol=1e-05, atol=1e-08):
     out : ndarray
         Array with the cumulative sums along the chosen axis.
     """
-    out = np.cumsum(arr, axis=axis, dtype=np.float64)
-    expected = np.sum(arr, axis=axis, dtype=np.float64)
-    if not np.all(
-        np.isclose(
+    xp, _ = get_namespace(arr)
+
+    out = xp.cumsum(arr, axis=axis, dtype=np.float64)
+    expected = xp.sum(arr, axis=axis, dtype=np.float64)
+    if not xp.all(
+        xp.isclose(
             out.take(-1, axis=axis), expected, rtol=rtol, atol=atol, equal_nan=True
         )
     ):
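
For reference, the sign convention svd_flip enforces is unchanged by this diff; only its array backend became pluggable. A small NumPy-only sketch of what it guarantees:

    import numpy as np
    from sklearn.utils.extmath import svd_flip

    rng = np.random.RandomState(0)
    X = rng.randn(6, 3)
    U, S, Vt = np.linalg.svd(X, full_matrices=False)
    U, Vt = svd_flip(U, Vt)
    # With u_based_decision=True (the default), the largest-magnitude entry
    # of each column of U is made positive; applying the same sign to the
    # matching row of Vt keeps the reconstruction exact.
    assert np.allclose(U @ np.diag(S) @ Vt, X)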
