add docs and fix test with smaller fucntions

Intron7 · Intron7 · commit ff3f823d5ba9 · 2026-01-23T16:37:00.000+01:00
diff --git a/docs/api/index.md b/docs/api/index.md
@@ -12,6 +12,7 @@ import rapids_singlecell as rsc
 
 scanpy_gpu
 squidpy_gpu
+pertpy_gpu
 decoupler_gpu
 get
 ```
diff --git a/docs/api/pertpy_gpu.md b/docs/api/pertpy_gpu.md
@@ -0,0 +1,20 @@
+# pertpy-GPU: `ptg`
+
+{mod}`pertpy` contains tools for perturbation analysis. {mod}`rapids_singlecell.ptg` accelerates some of these methods.
+
+## Distance
+
+```{eval-rst}
+.. module:: rapids_singlecell.ptg
+.. currentmodule:: rapids_singlecell
+
+.. autosummary::
+    :toctree: generated
+
+    ptg.Distance
+
+.. autoclass:: rapids_singlecell.ptg.Distance
+    :members:
+    :undoc-members:
+    :show-inheritance:
+```
diff --git a/docs/conf.py b/docs/conf.py
@@ -8,6 +8,7 @@
 from pathlib import Path, PurePosixPath
 from typing import TYPE_CHECKING
 import anndata  # noqa
+import fast_array_utils  # noqa
 
 if TYPE_CHECKING:
     from sphinx.application import Sphinx
diff --git a/docs/release-notes/0.13.6.md b/docs/release-notes/0.13.6.md
@@ -0,0 +1,5 @@
+### 0.13.6 {small}`the-future`
+
+```{rubric} Features
+```
+* Adds `ptg.Distance` for GPU-accelerated distance computation between groups of cells, compatible with pertpy's Distance API {pr}`454` {smaller}`S Dicks & S Özleyen`
diff --git a/tests/pertpy/test_distances.py b/tests/pertpy/test_distances.py
@@ -711,14 +711,30 @@ def test_distance_default_obsm_key() -> None:
 # ============================================================================
 
 
-def test_float64_matches_float32_results(small_adata: AnnData) -> None:
+def test_float64_matches_float32_results() -> None:
     """Test that float64 and float32 produce similar results (within float32 precision)."""
-    adata_f64 = small_adata.copy()
-    adata_f64.obsm["X_pca"] = small_adata.obsm["X_pca"].astype(cp.float64)
+    # Use small dataset to avoid GPU resource exhaustion with float64
+    rng = np.random.default_rng(0)
+    n_groups = 3
+    cells_per_group = 4
+    n_features = 5
+    total_cells = n_groups * cells_per_group
+
+    cpu_embedding = rng.normal(size=(total_cells, n_features)).astype(np.float32)
+    groups = [f"g{idx}" for idx in range(n_groups) for _ in range(cells_per_group)]
+    obs = pd.DataFrame(
+        {"group": pd.Categorical(groups, categories=[f"g{i}" for i in range(n_groups)])}
+    )
+
+    adata_f32 = AnnData(cpu_embedding, obs=obs)
+    adata_f32.obsm["X_pca"] = cp.asarray(cpu_embedding, dtype=cp.float32)
+
+    adata_f64 = AnnData(cpu_embedding, obs=obs.copy())
+    adata_f64.obsm["X_pca"] = cp.asarray(cpu_embedding, dtype=cp.float64)
 
     distance = Distance(metric="edistance")
 
-    result_f32 = distance.pairwise(small_adata, groupby="group")
+    result_f32 = distance.pairwise(adata_f32, groupby="group")
     result_f64 = distance.pairwise(adata_f64, groupby="group")
 
     np.testing.assert_allclose(
@@ -772,9 +788,10 @@ def test_bootstrap_different_feature_counts(n_features: int) -> None:
 def test_pairwise_correctness_parametrized(dtype) -> None:
     """Parametrized test for pairwise correctness across dtypes."""
     rng = np.random.default_rng(42)
-    n_groups = 4
-    cells_per_group = 15
-    n_features = 20
+    # Use smaller sizes for float64 to avoid GPU resource exhaustion
+    n_groups = 3
+    cells_per_group = 4 if dtype == np.float64 else 15
+    n_features = 5 if dtype == np.float64 else 20
     total_cells = n_groups * cells_per_group
 
     cpu_embedding = rng.normal(size=(total_cells, n_features)).astype(dtype)
@@ -793,7 +810,7 @@ def test_pairwise_correctness_parametrized(dtype) -> None:
     rtol = 1e-10 if dtype == np.float64 else 1e-5
     atol = 1e-12 if dtype == np.float64 else 1e-6
 
-    for g1, g2 in [("g0", "g1"), ("g1", "g3"), ("g2", "g3")]:
+    for g1, g2 in [("g0", "g1"), ("g0", "g2"), ("g1", "g2")]:
         X = cpu_embedding[np.array(groups) == g1]
         Y = cpu_embedding[np.array(groups) == g2]
         expected = _compute_energy_distance_cpu(X, Y)
@@ -807,30 +824,59 @@ def test_pairwise_correctness_parametrized(dtype) -> None:
         )
 
 
-@pytest.mark.parametrize("dtype", [np.float32, np.float64])
 @pytest.mark.parametrize("n_features", [50, 400])
-def test_correctness_dtype_and_features(dtype, n_features) -> None:
-    """Test correctness across dtypes and feature counts."""
+def test_correctness_float32_features(n_features) -> None:
+    """Test correctness across feature counts with float32."""
     rng = np.random.default_rng(42)
     n_groups = 3
     cells_per_group = 10
     total_cells = n_groups * cells_per_group
 
-    cpu_embedding = rng.normal(size=(total_cells, n_features)).astype(dtype)
+    cpu_embedding = rng.normal(size=(total_cells, n_features)).astype(np.float32)
     groups = [f"g{idx}" for idx in range(n_groups) for _ in range(cells_per_group)]
     obs = pd.DataFrame(
         {"group": pd.Categorical(groups, categories=[f"g{i}" for i in range(n_groups)])}
     )
 
-    adata = AnnData(cpu_embedding.copy().astype(np.float32), obs=obs)
-    adata.obsm["X_pca"] = cp.asarray(cpu_embedding, dtype=dtype)
+    adata = AnnData(cpu_embedding.copy(), obs=obs)
+    adata.obsm["X_pca"] = cp.asarray(cpu_embedding, dtype=np.float32)
 
     distance = Distance(metric="edistance")
     result_df = distance.pairwise(adata, groupby="group")
 
-    # Check correctness
-    rtol = 1e-10 if dtype == np.float64 else 1e-4
-    atol = 1e-12 if dtype == np.float64 else 1e-5
+    X = cpu_embedding[np.array(groups) == "g0"]
+    Y = cpu_embedding[np.array(groups) == "g1"]
+    expected = _compute_energy_distance_cpu(X, Y)
+    actual = result_df.loc["g0", "g1"]
+
+    np.testing.assert_allclose(
+        actual,
+        expected,
+        rtol=1e-4,
+        atol=1e-5,
+        err_msg=f"n_features={n_features} mismatch",
+    )
+
+
+def test_correctness_float64_small() -> None:
+    """Test correctness with float64 using small data to avoid GPU resource exhaustion."""
+    rng = np.random.default_rng(42)
+    n_groups = 3
+    cells_per_group = 4
+    n_features = 5
+    total_cells = n_groups * cells_per_group
+
+    cpu_embedding = rng.normal(size=(total_cells, n_features)).astype(np.float64)
+    groups = [f"g{idx}" for idx in range(n_groups) for _ in range(cells_per_group)]
+    obs = pd.DataFrame(
+        {"group": pd.Categorical(groups, categories=[f"g{i}" for i in range(n_groups)])}
+    )
+
+    adata = AnnData(cpu_embedding.copy().astype(np.float32), obs=obs)
+    adata.obsm["X_pca"] = cp.asarray(cpu_embedding, dtype=np.float64)
+
+    distance = Distance(metric="edistance")
+    result_df = distance.pairwise(adata, groupby="group")
 
     X = cpu_embedding[np.array(groups) == "g0"]
     Y = cpu_embedding[np.array(groups) == "g1"]
@@ -840,9 +886,9 @@ def test_correctness_dtype_and_features(dtype, n_features) -> None:
     np.testing.assert_allclose(
         actual,
         expected,
-        rtol=rtol,
-        atol=atol,
-        err_msg=f"dtype={dtype.__name__}, n_features={n_features} mismatch",
+        rtol=1e-10,
+        atol=1e-12,
+        err_msg="float64 mismatch",
     )
 
 
@@ -928,7 +974,7 @@ def pertpy_adata() -> AnnData:
 
     This uses the same data pertpy uses in their tests.
     """
-    import pertpy as pt
+    pt = pytest.importorskip("pertpy")
     import scanpy as sc
 
     adata = pt.dt.distance_example()