Fix int64_t type compatibility on Linux, remove the `sparse` and `return_matrix` parameters from emd (and `sparse` from emd2), and fix linting issues

nathanneike · nathanneike · commit 022720b295f4 · 2025-10-30T11:08:06.000+01:00
diff --git a/ot/lp/_network_simplex.py b/ot/lp/_network_simplex.py
@@ -12,7 +12,6 @@
 import warnings
 
 import scipy.sparse as sp
-import time
 from ..utils import list_to_array, check_number_threads
 from ..backend import get_backend
 from .emd_wrap import emd_c, emd_c_sparse, check_result
@@ -174,8 +173,6 @@ def emd(
     center_dual=True,
     numThreads=1,
     check_marginals=True,
-    sparse=False,
-    return_matrix=False,
 ):
     r"""Solves the Earth Movers distance problem and returns the OT matrix
 
@@ -236,22 +233,26 @@ def emd(
     check_marginals: bool, optional (default=True)
         If True, checks that the marginals mass are equal. If False, skips the
         check.
-    sparse: bool, optional (default=False)
-        If True, uses the sparse solver that only stores edges with finite costs.
-        When sparse=True, M should be a scipy.sparse matrix.
-    return_matrix: bool, optional (default=True)
-        If True, returns the transport matrix. If False and sparse=True, returns
-        sparse flow representation in log.
+
+    .. note:: The solver automatically detects sparse format when M is provided as:
+        - A scipy.sparse matrix (coo, csr, csc, etc.)
+        - A tuple (row_indices, col_indices, costs) representing an edge list
+
+        For sparse inputs, the solver uses a memory-efficient algorithm and returns
+        the flow in edge format (via log dict) instead of a full matrix.
 
 
     Returns
     -------
-    gamma: array-like, shape (ns, nt)
-        Optimal transportation matrix for the given
-        parameters
+    gamma: array-like, shape (ns, nt), or None
+        Optimal transportation matrix for the given parameters.
+        For sparse inputs this is None and log=True is required (else ValueError).
     log: dict, optional
-        If input log is true, a dictionary containing the
-        cost and dual variables and exit status
+        If input log is True, a dictionary containing the cost, dual variables,
+        and exit status. For sparse inputs with log=True, also contains:
+        - 'flow_sources': source nodes of flow edges
+        - 'flow_targets': target nodes of flow edges
+        - 'flow_values': flow values on edges
 
 
     Examples
@@ -287,7 +288,10 @@ def emd(
     edge_costs = None
     n1, n2 = None, None
 
-    if sparse:
+    # Auto-detect sparse format
+    is_sparse = sp.issparse(M) or (isinstance(M, tuple) and len(M) == 3)
+
+    if is_sparse:
         if sp.issparse(M):
             if not isinstance(M, sp.coo_matrix):
                 M_coo = sp.coo_matrix(M)
@@ -312,10 +316,6 @@ def emd(
             edge_costs = np.asarray(M[2], dtype=np.float64)
             n1 = int(edge_sources.max() + 1)
             n2 = int(edge_targets.max() + 1)
-        else:
-            raise ValueError(
-                "When sparse=True, M must be a scipy sparse matrix or a tuple (row, col, data)"
-            )
 
         a, b = list_to_array(a, b)
     else:
@@ -343,7 +343,7 @@ def emd(
             else nx.ones((M.shape[1],), type_as=type_as) / M.shape[1]
         )
 
-    if sparse:
+    if is_sparse:
         a, b = nx.to_numpy(a, b)
     else:
         M, a, b = nx.to_numpy(M, a, b)
@@ -375,14 +375,11 @@ def emd(
     numThreads = check_number_threads(numThreads)
 
     if edge_sources is not None:
+        # Sparse solver - never build full matrix
         flow_sources, flow_targets, flow_values, cost, u, v, result_code = emd_c_sparse(
             a, b, edge_sources, edge_targets, edge_costs, numItermax
         )
-        if return_matrix:
-            G = np.zeros((len(a), len(b)), dtype=np.float64)
-            G[flow_sources, flow_targets] = flow_values
-        else:
-            G = None
+        G = None
     else:
         G, cost, u, v, result_code = emd_c(a, b, M, numItermax, numThreads)
 
@@ -413,7 +410,8 @@ def emd(
         log_dict["warning"] = result_code_string
         log_dict["result_code"] = result_code
 
-        if edge_sources is not None and not return_matrix:
+        if edge_sources is not None:
+            # For sparse, include flow in edge format
             log_dict["flow_sources"] = flow_sources
             log_dict["flow_targets"] = flow_targets
             log_dict["flow_values"] = flow_values
@@ -427,7 +425,7 @@ def emd(
         return nx.from_numpy(G, type_as=type_as)
     else:
         raise ValueError(
-            "Cannot return matrix when return_matrix=False and sparse=True without log=True"
+            "For sparse inputs, log=True is required to get the flow in edge format"
         )
 
 
@@ -441,7 +439,6 @@ def emd2(
     center_dual=True,
     numThreads=1,
     check_marginals=True,
-    sparse=False,
     return_matrix=False,
 ):
     r"""Solves the Earth Movers distance problem and returns the loss
@@ -503,11 +500,12 @@ def emd2(
     check_marginals: bool, optional (default=True)
         If True, checks that the marginals mass are equal. If False, skips the
         check.
-    sparse: bool, optional (default=False)
-        If True, uses the sparse solver that only stores edges with finite costs.
-        This is memory-efficient when M has many infinite or forbidden edges.
-        When sparse=True, M should be a scipy.sparse matrix (coo, csr, or csc format)
-        or a tuple (row_indices, col_indices, costs) representing the edge list.
+
+    .. note:: The solver automatically detects sparse format when M is provided as:
+        - A scipy.sparse matrix (coo, csr, csc, etc.)
+        - A tuple (row_indices, col_indices, costs) representing an edge list
+
+        For sparse inputs, the solver uses a memory-efficient algorithm.
         Edges not included are treated as having infinite cost (forbidden).
 
 
@@ -554,14 +552,15 @@ def emd2(
     edge_costs = None
     n1, n2 = None, None
 
-    if sparse:
+    # Auto-detect sparse format
+    is_sparse = sp.issparse(M) or (isinstance(M, tuple) and len(M) == 3)
+
+    if is_sparse:
         if sp.issparse(M):
-            t0 = time.perf_counter()
             if not isinstance(M, sp.coo_matrix):
                 M_coo = sp.coo_matrix(M)
             else:
                 M_coo = M
-            t1 = time.perf_counter()
 
             edge_sources = (
                 M_coo.row if M_coo.row.dtype == np.int64 else M_coo.row.astype(np.int64)
@@ -574,21 +573,13 @@ def emd2(
                 if M_coo.data.dtype == np.float64
                 else M_coo.data.astype(np.float64)
             )
-            t2 = time.perf_counter()
-            print(
-                f"[PY SPARSE] COO conversion: {(t1-t0)*1000:.3f} ms, array copies: {(t2-t1)*1000:.3f} ms"
-            )
             n1, n2 = M_coo.shape
         elif isinstance(M, tuple) and len(M) == 3:
             edge_sources = np.asarray(M[0], dtype=np.int64)
             edge_targets = np.asarray(M[1], dtype=np.int64)
             edge_costs = np.asarray(M[2], dtype=np.float64)
             n1 = int(edge_sources.max() + 1)
             n2 = int(edge_targets.max() + 1)
-        else:
-            raise ValueError(
-                "When sparse=True, M must be a scipy sparse matrix or a tuple (row, col, data)"
-            )
 
         a, b = list_to_array(a, b)
     else:
@@ -618,14 +609,14 @@ def emd2(
         )
 
     a0, b0 = a, b
-    M0 = None if sparse else M
+    M0 = None if is_sparse else M
 
-    if sparse:
+    if is_sparse:
         edge_costs_original = nx.from_numpy(edge_costs, type_as=type_as)
     else:
         edge_costs_original = None
 
-    if sparse:
+    if is_sparse:
         a, b = nx.to_numpy(a, b)
     else:
         M, a, b = nx.to_numpy(M, a, b)
diff --git a/ot/lp/emd_wrap.pyx b/ot/lp/emd_wrap.pyx
@@ -14,15 +14,15 @@ from ..utils import dist
 
 cimport cython
 cimport libc.math as math
-from libc.stdint cimport uint64_t
+from libc.stdint cimport uint64_t, int64_t
 
 import warnings
 
 
 cdef extern from "EMD.h":
     int EMD_wrap(int n1,int n2, double *X, double *Y,double *D, double *G, double* alpha, double* beta, double *cost, uint64_t maxIter) nogil
     int EMD_wrap_omp(int n1,int n2, double *X, double *Y,double *D, double *G, double* alpha, double* beta, double *cost, uint64_t maxIter, int numThreads) nogil
-    int EMD_wrap_sparse(int n1, int n2, double *X, double *Y, uint64_t n_edges, long long *edge_sources, long long *edge_targets, double *edge_costs, long long *flow_sources_out, long long *flow_targets_out, double *flow_values_out, uint64_t *n_flows_out, double *alpha, double *beta, double *cost, uint64_t maxIter) nogil
+    int EMD_wrap_sparse(int n1, int n2, double *X, double *Y, uint64_t n_edges, int64_t *edge_sources, int64_t *edge_targets, double *edge_costs, int64_t *flow_sources_out, int64_t *flow_targets_out, double *flow_values_out, uint64_t *n_flows_out, double *alpha, double *beta, double *cost, uint64_t maxIter) nogil
     cdef enum ProblemType: INFEASIBLE, OPTIMAL, UNBOUNDED, MAX_ITER_REACHED
 
 
@@ -212,8 +212,8 @@ def emd_1d_sorted(np.ndarray[double, ndim=1, mode="c"] u_weights,
 @cython.wraparound(False)
 def emd_c_sparse(np.ndarray[double, ndim=1, mode="c"] a,
                 np.ndarray[double, ndim=1, mode="c"] b,
-                np.ndarray[long long, ndim=1, mode="c"] edge_sources,
-                np.ndarray[long long, ndim=1, mode="c"] edge_targets,
+                np.ndarray[int64_t, ndim=1, mode="c"] edge_sources,
+                np.ndarray[int64_t, ndim=1, mode="c"] edge_targets,
                 np.ndarray[double, ndim=1, mode="c"] edge_costs,
                 uint64_t max_iter):
     """
@@ -259,8 +259,8 @@ def emd_c_sparse(np.ndarray[double, ndim=1, mode="c"] a,
     cdef double cost = 0
 
     # Allocate output arrays (max size = n_edges)
-    cdef np.ndarray[long long, ndim=1, mode="c"] flow_sources = np.zeros(n_edges, dtype=np.int64)
-    cdef np.ndarray[long long, ndim=1, mode="c"] flow_targets = np.zeros(n_edges, dtype=np.int64)
+    cdef np.ndarray[int64_t, ndim=1, mode="c"] flow_sources = np.zeros(n_edges, dtype=np.int64)
+    cdef np.ndarray[int64_t, ndim=1, mode="c"] flow_targets = np.zeros(n_edges, dtype=np.int64)
     cdef np.ndarray[double, ndim=1, mode="c"] flow_values = np.zeros(n_edges, dtype=np.float64)
     cdef np.ndarray[double, ndim=1, mode="c"] alpha = np.zeros(n1)
     cdef np.ndarray[double, ndim=1, mode="c"] beta = np.zeros(n2)
@@ -270,8 +270,8 @@ def emd_c_sparse(np.ndarray[double, ndim=1, mode="c"] a,
             n1, n2,
             <double*> a.data, <double*> b.data,
             n_edges,
-            <long long*> edge_sources.data, <long long*> edge_targets.data, <double*> edge_costs.data,
-            <long long*> flow_sources.data, <long long*> flow_targets.data, <double*> flow_values.data,
+            <int64_t*> edge_sources.data, <int64_t*> edge_targets.data, <double*> edge_costs.data,
+            <int64_t*> flow_sources.data, <int64_t*> flow_targets.data, <double*> flow_values.data,
             &n_flows_out,
             <double*> alpha.data, <double*> beta.data, &cost, max_iter
         )
diff --git a/test/test_ot.py b/test/test_ot.py
@@ -985,19 +985,32 @@ def test_emd_sparse_vs_dense():
     C_augmented_dense[C_augmented_array > 0] = C_augmented_array[C_augmented_array > 0]
 
     G_dense, log_dense = ot.emd(a, b, C_augmented_dense, log=True)
-    G_sparse, log_sparse = ot.emd(
-        a, b, C_augmented, log=True, sparse=True, return_matrix=True
-    )
+    G_sparse, log_sparse = ot.emd(a, b, C_augmented, log=True)
 
     cost_dense = log_dense["cost"]
     cost_sparse = log_sparse["cost"]
 
     np.testing.assert_allclose(cost_dense, cost_sparse, rtol=1e-5, atol=1e-7)
 
+    # For dense, G_dense is returned; for sparse, reconstruct from flow edges
     np.testing.assert_allclose(a, G_dense.sum(1), rtol=1e-5, atol=1e-7)
     np.testing.assert_allclose(b, G_dense.sum(0), rtol=1e-5, atol=1e-7)
-    np.testing.assert_allclose(a, G_sparse.sum(1), rtol=1e-5, atol=1e-7)
-    np.testing.assert_allclose(b, G_sparse.sum(0), rtol=1e-5, atol=1e-7)
+
+    # Reconstruct sparse matrix from flow for marginal checks
+    if G_sparse is None:
+        G_sparse_reconstructed = np.zeros((n_source, n_target))
+        G_sparse_reconstructed[
+            log_sparse["flow_sources"], log_sparse["flow_targets"]
+        ] = log_sparse["flow_values"]
+        np.testing.assert_allclose(
+            a, G_sparse_reconstructed.sum(1), rtol=1e-5, atol=1e-7
+        )
+        np.testing.assert_allclose(
+            b, G_sparse_reconstructed.sum(0), rtol=1e-5, atol=1e-7
+        )
+    else:
+        np.testing.assert_allclose(a, G_sparse.sum(1), rtol=1e-5, atol=1e-7)
+        np.testing.assert_allclose(b, G_sparse.sum(0), rtol=1e-5, atol=1e-7)
 
 
 def test_emd2_sparse_vs_dense():
@@ -1071,7 +1084,7 @@ def test_emd2_sparse_vs_dense():
     C_augmented_dense[C_augmented_array > 0] = C_augmented_array[C_augmented_array > 0]
 
     cost_dense = ot.emd2(a, b, C_augmented_dense)
-    cost_sparse = ot.emd2(a, b, C_augmented, sparse=True)
+    cost_sparse = ot.emd2(a, b, C_augmented)
 
     np.testing.assert_allclose(cost_dense, cost_sparse, rtol=1e-5, atol=1e-7)