From d29fe057cfba5d24fd9442a0ef02fcba5d3b9c98 Mon Sep 17 00:00:00 2001
From: Vincent M <maladiere.vincent@yahoo.fr>
Date: Sat, 21 Jan 2023 15:36:07 +0100
Subject: [PATCH 1/2] remove TODOs and simplify variable names

---
 .../_middle_term_computer.pyx.tp              | 23 +++++++------------
 1 file changed, 8 insertions(+), 15 deletions(-)

diff --git a/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp b/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp
index 4eb3733c42bcf..5c3ca412252f8 100644
--- a/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp
+++ b/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp
@@ -38,14 +38,7 @@ import numpy as np
 from scipy.sparse import issparse, csr_matrix
 from ...utils._typedefs import DTYPE, SPARSE_INDEX_TYPE
 
-# TODO: If possible optimize this routine to efficiently treat cases where
-# `n_samples_X << n_samples_Y` met in practise when X_test consists of a
-# few samples, and thus when there's a single chunk of X whose number of
-# samples is less than the default chunk size.
-
-# TODO: compare this routine with the similar ones in SciPy, especially
-# `csr_matmat` which might implement a better algorithm.
-# See: https://github.com/scipy/scipy/blob/e58292e066ba2cb2f3d1e0563ca9314ff1f4f311/scipy/sparse/sparsetools/csr.h#L603-L669  # noqa
+
 cdef void _middle_term_sparse_sparse_64(
     const DTYPE_t[:] X_data,
     const SPARSE_INDEX_TYPE_t[:] X_indices,
@@ -66,17 +59,17 @@ cdef void _middle_term_sparse_sparse_64(
         ITYPE_t i, j, k
         ITYPE_t n_X = X_end - X_start
         ITYPE_t n_Y = Y_end - Y_start
-        ITYPE_t X_i_col_idx, X_i_ptr, Y_j_col_idx, Y_j_ptr
+        ITYPE_t x_col, x_ptr, y_col, y_ptr
 
     for i in range(n_X):
-        for X_i_ptr in range(X_indptr[X_start+i], X_indptr[X_start+i+1]):
-            X_i_col_idx = X_indices[X_i_ptr]
+        for x_ptr in range(X_indptr[X_start+i], X_indptr[X_start+i+1]):
+            x_col = X_indices[x_ptr]
             for j in range(n_Y):
                 k = i * n_Y + j
-                for Y_j_ptr in range(Y_indptr[Y_start+j], Y_indptr[Y_start+j+1]):
-                    Y_j_col_idx = Y_indices[Y_j_ptr]
-                    if X_i_col_idx == Y_j_col_idx:
-                        D[k] += -2 * X_data[X_i_ptr] * Y_data[Y_j_ptr]
+                for y_ptr in range(Y_indptr[Y_start+j], Y_indptr[Y_start+j+1]):
+                    y_col = Y_indices[y_ptr]
+                    if x_col == y_col:
+                        D[k] += -2 * X_data[x_ptr] * Y_data[y_ptr]
 
 
 {{for name_suffix, upcast_to_float64, INPUT_DTYPE_t, INPUT_DTYPE in implementation_specific_values}}

From 777e0126d81c091ea870b7159091cd0ac458cb70 Mon Sep 17 00:00:00 2001
From: Vincent M <maladiere.vincent@yahoo.fr>
Date: Wed, 1 Feb 2023 09:45:22 +0100
Subject: [PATCH 2/2] Remove extra blank line in
 sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp

Co-authored-by: Julien Jerphanion <git@jjerphan.xyz>
---
 .../_pairwise_distances_reduction/_middle_term_computer.pyx.tp   | 1 -
 1 file changed, 1 deletion(-)

diff --git a/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp b/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp
index 5c3ca412252f8..dd8b205c753e0 100644
--- a/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp
+++ b/sklearn/metrics/_pairwise_distances_reduction/_middle_term_computer.pyx.tp
@@ -38,7 +38,6 @@ import numpy as np
 from scipy.sparse import issparse, csr_matrix
 from ...utils._typedefs import DTYPE, SPARSE_INDEX_TYPE
 
-
 cdef void _middle_term_sparse_sparse_64(
     const DTYPE_t[:] X_data,
     const SPARSE_INDEX_TYPE_t[:] X_indices,