From b45511f8893aaac9441324eb82c5afe3f7d1f59b Mon Sep 17 00:00:00 2001
From: Intron7
Date: Tue, 9 Sep 2025 08:46:42 +0200
Subject: [PATCH 1/2] add PV

---
 src/decoupler/mt/_pv.py  | 78 ++++++++++++++++++++++++++++++++++++++++
 src/decoupler/mt/_run.py |  4 +--
 tests/mt/test_adj.py     | 17 +++++++++
 3 files changed, 97 insertions(+), 2 deletions(-)
 create mode 100644 src/decoupler/mt/_pv.py
 create mode 100644 tests/mt/test_adj.py

diff --git a/src/decoupler/mt/_pv.py b/src/decoupler/mt/_pv.py
new file mode 100644
index 0000000..dacaffb
--- /dev/null
+++ b/src/decoupler/mt/_pv.py
@@ -0,0 +1,78 @@
+import numba as nb
+import numpy as np
+
+
+@nb.njit(cache=True)
+def _fdr_bh_single_row(ps_row, m):
+    """
+    Apply Benjamini-Hochberg correction to a single row.
+    """
+    # Sort the row and get indices
+    order = np.argsort(ps_row)
+    ps_sorted = ps_row[order]
+
+    # BH scale: p_(i) * m / i
+    ps_bh = np.empty_like(ps_sorted, dtype=np.float64)
+    for i in range(m):
+        ps_bh[i] = ps_sorted[i] * (m / (i + 1))
+
+    # Reverse cumulative min
+    ps_rev = np.empty_like(ps_bh, dtype=np.float64)
+    for i in range(m):
+        ps_rev[i] = ps_bh[m - 1 - i]
+
+    for j in range(1, m):
+        ps_rev[j] = min(ps_rev[j], ps_rev[j - 1])
+
+    # Reverse back
+    ps_monotone = np.empty_like(ps_rev, dtype=np.float64)
+    for i in range(m):
+        ps_monotone[i] = ps_rev[m - 1 - i]
+
+    # Unsort back to original order
+    ps_adj = np.empty_like(ps_monotone, dtype=np.float64)
+    for i in range(m):
+        ps_adj[order[i]] = ps_monotone[i]
+
+    # Clip to [0, 1]
+    for i in range(m):
+        ps_adj[i] = max(0.0, min(1.0, ps_adj[i]))
+
+    return ps_adj
+
+
+@nb.njit(parallel=True, cache=True)
+def _fdr_bh_parallel(ps, m):
+    """
+    Apply Benjamini-Hochberg correction to all rows in parallel.
+    """
+    n_rows = ps.shape[0]
+    result = np.empty_like(ps, dtype=np.float64)
+
+    for i in nb.prange(n_rows):
+        result[i] = _fdr_bh_single_row(ps[i], m)
+
+    return result
+
+
+def _fdr_bh_axis1_numba(ps):
+    """
+    Benjamini–Hochberg adjusted p-values along axis=1 (rows).
+    ps: numpy.ndarray (n_rows, n_tests), values in [0, 1].
+    Returns: numpy.ndarray of same shape.
+    """
+    ps = np.asarray(ps, dtype=np.float64)
+    if ps.ndim != 2:
+        raise ValueError("ps must be 2D (n_rows, n_tests) for axis=1.")
+    if not np.issubdtype(ps.dtype, np.number):
+        raise ValueError("`ps` must be numeric.")
+    if not np.all((ps >= 0) & (ps <= 1)):
+        raise ValueError("`ps` must be within [0, 1].")
+
+    n_rows, m = ps.shape
+    if m <= 1:
+        return ps.copy().astype(np.float32)
+
+    # Process each row in parallel
+    result = _fdr_bh_parallel(ps, m)
+    return result.astype(np.float32)
diff --git a/src/decoupler/mt/_run.py b/src/decoupler/mt/_run.py
index abb8319..321f8b5 100644
--- a/src/decoupler/mt/_run.py
+++ b/src/decoupler/mt/_run.py
@@ -3,12 +3,12 @@
 import numpy as np
 import pandas as pd
 import scipy.sparse as sps
-import scipy.stats as sts
 from anndata import AnnData
 from tqdm.auto import tqdm
 
 from decoupler._datatype import DataType
 from decoupler._log import _log
+from decoupler.mt._pv import _fdr_bh_axis1_numba
 from decoupler.pp.data import extract
 from decoupler.pp.net import adjmat, idxmat, prune
 
@@ -115,7 +115,7 @@ def _run(
         pv = pd.DataFrame(pv, index=obs, columns=sources)
         if name != "mlm":
             _log(f"{name} - adjusting p-values by FDR", level="info", verbose=verbose)
-            pv.loc[:, :] = sts.false_discovery_control(pv.values, axis=1, method="bh")
+            pv.loc[:, :] = _fdr_bh_axis1_numba(pv.values)
     else:
         pv = None
     _log(f"{name} - done", level="info", verbose=verbose)
diff --git a/tests/mt/test_adj.py b/tests/mt/test_adj.py
new file mode 100644
index 0000000..11f7fdd
--- /dev/null
+++ b/tests/mt/test_adj.py
@@ -0,0 +1,17 @@
+from __future__ import annotations
+
+import numpy as np
+import scipy.stats as sts
+
+import decoupler as dc
+from decoupler.mt._pv import _fdr_bh_axis1_numba
+
+
+def test_func_mlm(
+    adata,
+    net,
+):
+    dc.mt.mlm(data=adata, net=net, tmin=3)
+    dc_pv = adata.obsm["padj_mlm"]
+    adj = _fdr_bh_axis1_numba(dc_pv.values)
+    np.testing.assert_allclose(adj, sts.false_discovery_control(dc_pv.values, axis=1, method="bh"))

From a8e7fa6852ab6c8c738b81050b3f53f8fe61115a Mon Sep 17 00:00:00 2001
From: Intron7
Date: Tue, 9 Sep 2025 08:52:23 +0200
Subject: [PATCH 2/2] pre-commit fix

---
 src/decoupler/mt/_pv.py | 14 +++-----------
 1 file changed, 3 insertions(+), 11 deletions(-)

diff --git a/src/decoupler/mt/_pv.py b/src/decoupler/mt/_pv.py
index dacaffb..b861907 100644
--- a/src/decoupler/mt/_pv.py
+++ b/src/decoupler/mt/_pv.py
@@ -4,9 +4,7 @@
 
 @nb.njit(cache=True)
 def _fdr_bh_single_row(ps_row, m):
-    """
-    Apply Benjamini-Hochberg correction to a single row.
-    """
+    """Apply Benjamini-Hochberg correction to a single row."""
     # Sort the row and get indices
     order = np.argsort(ps_row)
     ps_sorted = ps_row[order]
@@ -43,9 +41,7 @@ def _fdr_bh_single_row(ps_row, m):
 
 @nb.njit(parallel=True, cache=True)
 def _fdr_bh_parallel(ps, m):
-    """
-    Apply Benjamini-Hochberg correction to all rows in parallel.
-    """
+    """Apply Benjamini-Hochberg correction to all rows in parallel."""
     n_rows = ps.shape[0]
     result = np.empty_like(ps, dtype=np.float64)
 
@@ -56,11 +52,7 @@ def _fdr_bh_parallel(ps, m):
 
 
 def _fdr_bh_axis1_numba(ps):
-    """
-    Benjamini–Hochberg adjusted p-values along axis=1 (rows).
-    ps: numpy.ndarray (n_rows, n_tests), values in [0, 1].
-    Returns: numpy.ndarray of same shape.
-    """
+    """Benjamini–Hochberg adjusted p-values along axis=1 (rows)."""
     ps = np.asarray(ps, dtype=np.float64)
     if ps.ndim != 2:
         raise ValueError("ps must be 2D (n_rows, n_tests) for axis=1.")
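
For reference, the new helper is intended as a row-wise (axis=1) replacement for
scipy.stats.false_discovery_control, and the added test checks exactly that
equivalence. A minimal standalone sketch of the same check, not part of either
commit above, assuming a decoupler checkout with this patch series applied; rtol
is loosened because _fdr_bh_axis1_numba casts its result to float32 while SciPy
returns float64:

    import numpy as np
    import scipy.stats as sts

    from decoupler.mt._pv import _fdr_bh_axis1_numba

    rng = np.random.default_rng(0)
    ps = rng.uniform(size=(5, 20))  # 5 rows (observations) x 20 tests per row

    adj_numba = _fdr_bh_axis1_numba(ps)  # row-wise BH-adjusted p-values, float32
    adj_scipy = sts.false_discovery_control(ps, axis=1, method="bh")  # reference

    np.testing.assert_allclose(adj_numba, adj_scipy, rtol=1e-5)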