Commit 728bd53
Add JAX array support to pted and pted_coverage_test (#14)
* Initial plan
* Add JAX compatibility to pted and pted_coverage_test
* Add jax as a dev dependency
* Update README for JAX support and add utils unit tests with mocking
* Optimize _jax_cdist: squared-norm identity for L2, vmap for general p
* Update pted() signatures/docstrings for jax.Array; add jax optional extra in pyproject.toml
* Add cross-backend consistency tests for numpy/torch/JAX energy distance utils

Co-authored-by: copilot-swe-agent[bot] <198982749+Copilot@users.noreply.github.com>
Co-authored-by: ConnorStoneAstro <78555321+ConnorStoneAstro@users.noreply.github.com>
1 parent a5a45a8 commit 728bd53

5 files changed

Lines changed: 423 additions & 28 deletions

README.md

Lines changed: 31 additions & 12 deletions
@@ -29,6 +29,12 @@ If you want to run PTED on GPUs using PyTorch, then also install torch:
 pip install torch
 ```
 
+If you want to use JAX arrays as inputs, then also install jax:
+
+```bash
+pip install jax
+```
+
 The two functions are ``pted.pted`` and ``pted.pted_coverage_test``. For
 information about each argument, just use ``help(pted.pted)`` or
 ``help(pted.pted_coverage_test)``.
@@ -261,8 +267,8 @@ results you are getting!
 
 ```python
 def pted(
-    x: Union[np.ndarray, "Tensor"],
-    y: Union[np.ndarray, "Tensor"],
+    x: Union[np.ndarray, "Tensor", "jax.Array"],
+    y: Union[np.ndarray, "Tensor", "jax.Array"],
     permutations: int = 1000,
     metric: Union[str, float] = "euclidean",
     return_all: bool = False,
@@ -273,10 +279,10 @@ def pted(
 ) -> Union[float, tuple[float, np.ndarray, float]]:
 ```
 
-* **x** *(Union[np.ndarray, Tensor])*: first set of samples. Shape (N, *D)
-* **y** *(Union[np.ndarray, Tensor])*: second set of samples. Shape (M, *D)
+* **x** *(Union[np.ndarray, Tensor, jax.Array])*: first set of samples. Shape (N, *D)
+* **y** *(Union[np.ndarray, Tensor, jax.Array])*: second set of samples. Shape (M, *D)
 * **permutations** *(int)*: number of permutations to run. This determines how accurately the p-value is computed.
-* **metric** *(Union[str, float])*: distance metric to use. See scipy.spatial.distance.cdist for the list of available metrics with numpy. See torch.cdist when using PyTorch, note that the metric is passed as the "p" for torch.cdist and therefore is a float from 0 to inf.
+* **metric** *(Union[str, float])*: distance metric to use. See scipy.spatial.distance.cdist for the list of available metrics with numpy. See torch.cdist when using PyTorch, note that the metric is passed as the "p" for torch.cdist and therefore is a float from 0 to inf. When using JAX arrays, the metric is passed as the "ord" for jnp.linalg.norm and therefore is also a float.
 * **return_all** *(bool)*: if True, return the test statistic and the permuted statistics with the p-value. If False, just return the p-value. bool (default: False)
 * **chunk_size** *(Optional[int])*: if not None, use chunked energy distance estimation. This is useful for large datasets. The chunk size is the number of samples to use for each chunk. If None, use the full dataset.
 * **chunk_iter** *(Optional[int])*: The chunk iter is the number of iterations to use with the given chunk size.
@@ -287,8 +293,8 @@ def pted(
 
 ```python
 def pted_coverage_test(
-    g: Union[np.ndarray, "Tensor"],
-    s: Union[np.ndarray, "Tensor"],
+    g: Union[np.ndarray, "Tensor", "jax.Array"],
+    s: Union[np.ndarray, "Tensor", "jax.Array"],
     permutations: int = 1000,
     metric: Union[str, float] = "euclidean",
     warn_confidence: Optional[float] = 1e-3,
@@ -301,10 +307,10 @@ def pted_coverage_test(
 ) -> Union[float, tuple[np.ndarray, np.ndarray, float]]:
 ```
 
-* **g** *(Union[np.ndarray, Tensor])*: Ground truth samples. Shape (n_sims, *D)
-* **s** *(Union[np.ndarray, Tensor])*: Posterior samples. Shape (n_samples, n_sims, *D)
+* **g** *(Union[np.ndarray, Tensor, jax.Array])*: Ground truth samples. Shape (n_sims, *D)
+* **s** *(Union[np.ndarray, Tensor, jax.Array])*: Posterior samples. Shape (n_samples, n_sims, *D)
 * **permutations** *(int)*: number of permutations to run. This determines how accurately the p-value is computed.
-* **metric** *(Union[str, float])*: distance metric to use. See scipy.spatial.distance.cdist for the list of available metrics with numpy. See torch.cdist when using PyTorch, note that the metric is passed as the "p" for torch.cdist and therefore is a float from 0 to inf.
+* **metric** *(Union[str, float])*: distance metric to use. See scipy.spatial.distance.cdist for the list of available metrics with numpy. See torch.cdist when using PyTorch, note that the metric is passed as the "p" for torch.cdist and therefore is a float from 0 to inf. When using JAX arrays, the metric is passed as the "ord" for jnp.linalg.norm and therefore is also a float.
 * **return_all** *(bool)*: if True, return the test statistic and the permuted statistics with the p-value. If False, just return the p-value. bool (default: False)
 * **chunk_size** *(Optional[int])*: if not None, use chunked energy distance estimation. This is useful for large datasets. The chunk size is the number of samples to use for each chunk. If None, use the full dataset.
 * **chunk_iter** *(Optional[int])*: The chunk iter is the number of iterations to use with the given chunk size.
@@ -315,9 +321,9 @@ def pted_coverage_test(
 ## GPU Compatibility
 
 PTED works on both CPU and GPU. All that is needed is to pass the `x` and `y` as
-PyTorch Tensors on the appropriate device.
+PyTorch Tensors or JAX Arrays on the appropriate device.
 
-Example:
+Example with PyTorch:
 ```python
 from pted import pted
 import numpy as np
@@ -330,6 +336,19 @@ p_value = pted(torch.tensor(x), torch.tensor(y))
 print(f"p-value: {p_value:.3f}") # expect uniform random from 0-1
 ```
 
+Example with JAX:
+```python
+from pted import pted
+import numpy as np
+import jax.numpy as jnp
+
+x = np.random.normal(size = (500, 10)) # (n_samples_x, n_dimensions)
+y = np.random.normal(size = (400, 10)) # (n_samples_y, n_dimensions)
+
+p_value = pted(jnp.array(x), jnp.array(y))
+print(f"p-value: {p_value:.3f}") # expect uniform random from 0-1
+```
+
 ## Memory and Compute limitations
 
 If a GPU isn't enough to get PTED running fast enough for you, or if you are
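Under the hood, PTED's permutation test computes one pooled distance matrix and re-labels which samples belong to `x` versus `y` by permuting its rows and columns (this is visible in the `pted_jax` diff below). A minimal NumPy-only sketch of that idea, with hypothetical helper names rather than the library's internals:

```python
import numpy as np

def energy_distance(D, nx):
    # D: (nx+ny, nx+ny) pairwise distance matrix over the pooled samples.
    xy = D[:nx, nx:].mean()  # cross-term E|X - Y|
    xx = D[:nx, :nx].mean()  # within-term E|X - X'|
    yy = D[nx:, nx:].mean()  # within-term E|Y - Y'|
    return 2 * xy - xx - yy

def permutation_p_value(x, y, permutations=1000, seed=0):
    rng = np.random.default_rng(seed)
    z = np.concatenate([x, y], axis=0)
    # Euclidean distance matrix via broadcasting (fine for small N).
    D = np.linalg.norm(z[:, None, :] - z[None, :, :], axis=-1)
    nx = len(x)
    test = energy_distance(D, nx)
    permuted = []
    for _ in range(permutations):
        # Permuting rows and columns of D relabels x vs y membership
        # without recomputing any distances.
        I = rng.permutation(len(z))
        permuted.append(energy_distance(D[I][:, I], nx))
    # Fraction of permuted statistics at least as large as the observed one.
    return np.mean(np.array(permuted) >= test)

x = np.random.default_rng(1).normal(size=(100, 5))
y = np.random.default_rng(2).normal(size=(80, 5))
print(f"p-value: {permutation_p_value(x, y):.3f}")  # same distribution, so p should not be tiny
```

This is the reason the full-matrix backends scale as O((N+M)^2) memory, and why the chunked variants exist.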

pyproject.toml

Lines changed: 4 additions & 0 deletions
@@ -41,11 +41,15 @@ dev = [
     "pytest-cov>=4.1,<5",
     "pytest-mock>=3.12,<4",
     "torch>=2.0,<3",
+    "jax>=0.4,<1",
     "matplotlib",
 ]
 torch = [
     "torch>=2.0,<3",
 ]
+jax = [
+    "jax>=0.4,<1",
+]
 
 [tool.hatch.metadata.hooks.requirements_txt]
 files = ["requirements.txt"]
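With the `jax` extra defined above, users could opt into the optional dependency at install time. A hedged sketch, assuming the package is published on PyPI under the name `pted` (an assumption, not confirmed by this diff):

```shell
# Hypothetical install commands, assuming the distribution name "pted":
pip install "pted[jax]"    # pulls in jax>=0.4,<1
pip install "pted[torch]"  # pulls in torch>=2.0,<3
```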

src/pted/pted.py

Lines changed: 37 additions & 16 deletions
@@ -4,10 +4,13 @@
 
 from .utils import (
     is_torch_tensor,
+    is_jax_array,
     pted_torch,
     pted_numpy,
     pted_chunk_torch,
     pted_chunk_numpy,
+    pted_jax,
+    pted_chunk_jax,
     two_tailed_p,
     confidence_alert,
     simulation_based_calibration_histogram,
@@ -17,8 +20,8 @@
 
 
 def pted(
-    x: Union[np.ndarray, "Tensor"],
-    y: Union[np.ndarray, "Tensor"],
+    x: Union[np.ndarray, "Tensor", "jax.Array"],
+    y: Union[np.ndarray, "Tensor", "jax.Array"],
     permutations: int = 1000,
     metric: Union[str, float] = "euclidean",
     return_all: bool = False,
@@ -72,14 +75,17 @@ def pted(
 
     Parameters
     ----------
-    x (Union[np.ndarray, Tensor]): first set of samples. Shape (N, *D)
-    y (Union[np.ndarray, Tensor]): second set of samples. Shape (M, *D)
+    x (Union[np.ndarray, Tensor, jax.Array]): first set of samples. Shape (N, *D)
+    y (Union[np.ndarray, Tensor, jax.Array]): second set of samples. Shape (M, *D)
     permutations (int): number of permutations to run. This determines how
         accurately the p-value is computed.
-    metric (Union[str, float]): distance metric to use. See scipy.spatial.distance.cdist
-        for the list of available metrics with numpy. See torch.cdist when
-        using PyTorch, note that the metric is passed as the "p" for
-        torch.cdist and therefore is a float from 0 to inf.
+    metric (Union[str, float]): distance metric to use. For NumPy inputs,
+        see scipy.spatial.distance.cdist for available metrics. For PyTorch
+        inputs, the metric is passed as the "p" argument to torch.cdist and
+        therefore is a float from 0 to inf. For JAX inputs, "euclidean" uses
+        the squared-norm identity (p=2), and any float p uses
+        jnp.linalg.norm with ord=p; string metrics other than "euclidean"
+        are not supported for JAX.
     return_all (bool): if True, return the test statistic and the permuted
         statistics with the p-value. If False, just return the p-value.
         bool (default: False)
@@ -140,6 +146,18 @@ def pted(
         )
     elif is_torch_tensor(x):
        test, permute = pted_torch(x, y, permutations=permutations, metric=metric, prog_bar=prog_bar)
+    elif is_jax_array(x) and chunk_size is not None:
+        test, permute = pted_chunk_jax(
+            x,
+            y,
+            permutations=permutations,
+            metric=metric,
+            chunk_size=int(chunk_size),
+            chunk_iter=int(chunk_iter),
+            prog_bar=prog_bar,
+        )
+    elif is_jax_array(x):
+        test, permute = pted_jax(x, y, permutations=permutations, metric=metric, prog_bar=prog_bar)
     elif chunk_size is not None:
         test, permute = pted_chunk_numpy(
             x,
@@ -170,8 +188,8 @@ def pted(
 
 
 def pted_coverage_test(
-    g: Union[np.ndarray, "Tensor"],
-    s: Union[np.ndarray, "Tensor"],
+    g: Union[np.ndarray, "Tensor", "jax.Array"],
+    s: Union[np.ndarray, "Tensor", "jax.Array"],
     permutations: int = 1000,
     metric: Union[str, float] = "euclidean",
     warn_confidence: Optional[float] = 1e-3,
@@ -228,14 +246,17 @@ def pted_coverage_test(
 
     Parameters
     ----------
-    g (Union[np.ndarray, Tensor]): Ground truth samples. Shape (n_sims, *D)
-    s (Union[np.ndarray, Tensor]): Posterior samples. Shape (n_samples, n_sims, *D)
+    g (Union[np.ndarray, Tensor, jax.Array]): Ground truth samples. Shape (n_sims, *D)
+    s (Union[np.ndarray, Tensor, jax.Array]): Posterior samples. Shape (n_samples, n_sims, *D)
     permutations (int): number of permutations to run. This determines how
         accurately the p-value is computed.
-    metric (Union[str, float]): distance metric to use. See scipy.spatial.distance.cdist
-        for the list of available metrics with numpy. See torch.cdist when using
-        PyTorch, note that the metric is passed as the "p" for torch.cdist and
-        therefore is a float from 0 to inf.
+    metric (Union[str, float]): distance metric to use. For NumPy inputs,
+        see scipy.spatial.distance.cdist for available metrics. For PyTorch
+        inputs, the metric is passed as the "p" argument to torch.cdist and
+        therefore is a float from 0 to inf. For JAX inputs, "euclidean" uses
+        the squared-norm identity (p=2), and any float p uses
+        jnp.linalg.norm with ord=p; string metrics other than "euclidean"
+        are not supported for JAX.
     return_all (bool): if True, return the test statistic and the permuted
         statistics with the p-value. If False, just return the p-value. bool
         (default: False)
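The dispatch chain added to `pted()` relies on backend checks that fail soft when the optional dependency is missing: `is_jax_array` must return False, not raise, if JAX is absent. A standalone sketch of that pattern (the `dispatch` helper is illustrative only; the real function also handles torch tensors):

```python
import numpy as np

try:
    import jax
except ImportError:  # JAX is optional; fall back cleanly
    jax = None

def is_jax_array(o):
    # Same guarded check as in the diff: never raises when jax is missing.
    if jax is None:
        return False
    return isinstance(o, jax.Array)

def dispatch(x, chunk_size=None):
    # Mirrors the elif chain in pted(): most specific backend first,
    # chunked variants before full-matrix variants.
    if is_jax_array(x) and chunk_size is not None:
        return "pted_chunk_jax"
    elif is_jax_array(x):
        return "pted_jax"
    elif chunk_size is not None:
        return "pted_chunk_numpy"
    return "pted_numpy"

print(dispatch(np.ones((4, 2))))                # → pted_numpy
print(dispatch(np.ones((4, 2)), chunk_size=2))  # → pted_chunk_numpy
```

Note the ordering matters: because `is_jax_array(x) and chunk_size is not None` is tested before the bare `is_jax_array(x)`, a JAX array with chunking requested never falls through to the full-matrix path.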

src/pted/utils.py

Lines changed: 113 additions & 0 deletions
@@ -16,12 +16,23 @@ class torch:
         Tensor = np.ndarray
 
 
+try:
+    import jax
+    import jax.numpy as jnp
+except ImportError:
+    jax = None
+    jnp = None
+
+
 __all__ = (
     "is_torch_tensor",
+    "is_jax_array",
     "pted_numpy",
     "pted_chunk_numpy",
     "pted_torch",
     "pted_chunk_torch",
+    "pted_jax",
+    "pted_chunk_jax",
     "two_tailed_p",
     "confidence_alert",
     "simulation_based_calibration_histogram",
@@ -39,6 +50,12 @@ def is_torch_tensor(o):
     )
 
 
+def is_jax_array(o):
+    if jax is None:
+        return False
+    return isinstance(o, jax.Array)
+
+
 def _energy_distance_precompute(
     D: Union[np.ndarray, torch.Tensor], nx: int, ny: int
 ) -> Union[float, torch.Tensor]:
@@ -110,6 +127,49 @@ def _energy_distance_estimate_torch(
     return np.mean(E_est)
 
 
+def _jax_cdist(x, y, p: float = 2.0):
+    if p == 2.0:
+        # Squared-norm identity avoids materializing the (nx, ny, d) diff tensor.
+        # ||x_i - y_j||^2 = ||x_i||^2 + ||y_j||^2 - 2 * x_i . y_j
+        x_sq = jnp.sum(x ** 2, axis=-1)  # (nx,)
+        y_sq = jnp.sum(y ** 2, axis=-1)  # (ny,)
+        sq_dist = x_sq[:, None] + y_sq[None, :] - 2.0 * (x @ y.T)
+        return jnp.sqrt(jnp.maximum(sq_dist, 0.0))
+    # For general p-norms use vmap to avoid the (nx, ny, d) intermediate.
+    return jax.vmap(lambda xi: jnp.linalg.norm(xi - y, ord=p, axis=-1))(x)
+
+
+def _energy_distance_jax(x, y, metric: Union[str, float] = "euclidean") -> float:
+    nx = len(x)
+    ny = len(y)
+    z = jnp.concatenate([x, y], axis=0)
+    if metric == "euclidean":
+        metric = 2.0
+    D = _jax_cdist(z, z, p=metric)
+    return float(_energy_distance_precompute(D, nx, ny))
+
+
+def _energy_distance_estimate_jax(
+    x,
+    y,
+    chunk_size: int,
+    chunk_iter: int,
+    metric: Union[str, float] = "euclidean",
+) -> float:
+
+    E_est = []
+    for _ in range(chunk_iter):
+        # Randomly sample a chunk of data
+        idx = np.random.choice(len(x), size=min(len(x), chunk_size), replace=False)
+        x_chunk = x[idx]
+        idy = np.random.choice(len(y), size=min(len(y), chunk_size), replace=False)
+        y_chunk = y[idy]
+
+        # Compute the energy distance
+        E_est.append(_energy_distance_jax(x_chunk, y_chunk, metric=metric))
+    return np.mean(E_est)
+
+
 def pted_chunk_numpy(
     x: np.ndarray,
     y: np.ndarray,
@@ -210,6 +270,59 @@ def pted_torch(
     return test_stat, permute_stats
 
 
+def pted_jax(
+    x,
+    y,
+    permutations: int = 100,
+    metric: Union[str, float] = "euclidean",
+    prog_bar: bool = False,
+) -> tuple[float, list[float]]:
+    assert jax is not None, "JAX is not installed! try: `pip install jax`"
+    z = jnp.concatenate([x, y], axis=0)
+    assert jnp.all(jnp.isfinite(z)), "Input contains NaN or Inf!"
+    if metric == "euclidean":
+        metric = 2.0
+    dmatrix = _jax_cdist(z, z, p=metric)
+    assert jnp.all(
+        jnp.isfinite(dmatrix)
+    ), "Distance matrix contains NaN or Inf! Consider using a different metric or normalizing values to be more stable (i.e. z-score norm)."
+    nx = len(x)
+    ny = len(y)
+
+    test_stat = float(_energy_distance_precompute(dmatrix, nx, ny))
+    permute_stats = []
+    for _ in trange(permutations, disable=not prog_bar):
+        I = np.random.permutation(len(z))
+        dmatrix = dmatrix[I][:, I]
+        permute_stats.append(float(_energy_distance_precompute(dmatrix, nx, ny)))
+    return test_stat, permute_stats
+
+
+def pted_chunk_jax(
+    x,
+    y,
+    permutations: int = 100,
+    metric: Union[str, float] = "euclidean",
+    chunk_size: int = 100,
+    chunk_iter: int = 10,
+    prog_bar: bool = False,
+) -> tuple[float, list[float]]:
+    assert jax is not None, "JAX is not installed! try: `pip install jax`"
+    assert jnp.all(jnp.isfinite(x)) and jnp.all(jnp.isfinite(y)), "Input contains NaN or Inf!"
+    nx = len(x)
+
+    test_stat = _energy_distance_estimate_jax(x, y, chunk_size, chunk_iter, metric=metric)
+    permute_stats = []
+    for _ in trange(permutations, disable=not prog_bar):
+        z = jnp.concatenate([x, y], axis=0)
+        z = z[np.random.permutation(len(z))]
+        x, y = z[:nx], z[nx:]
+        permute_stats.append(
+            _energy_distance_estimate_jax(x, y, chunk_size, chunk_iter, metric=metric)
+        )
+    return test_stat, permute_stats
+
+
 def two_tailed_p(chi2, df):
     assert df > 2, "Degrees of freedom must be greater than 2 for two-tailed p-value calculation."
     alpha = chi2_dist.pdf(chi2, df)
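The fast path of `_jax_cdist` rests on the expansion ||x_i - y_j||^2 = ||x_i||^2 + ||y_j||^2 - 2 x_i·y_j, which trades the (nx, ny, d) difference tensor for a single matrix product. A quick NumPy check of that identity against the naive broadcasted computation (NumPy stands in for jnp here):

```python
import numpy as np

rng = np.random.default_rng(0)
x = rng.normal(size=(6, 4))
y = rng.normal(size=(5, 4))

# Identity used in _jax_cdist: ||x_i - y_j||^2 = ||x_i||^2 + ||y_j||^2 - 2 x_i.y_j
x_sq = np.sum(x ** 2, axis=-1)  # (6,)
y_sq = np.sum(y ** 2, axis=-1)  # (5,)
sq = x_sq[:, None] + y_sq[None, :] - 2.0 * (x @ y.T)
fast = np.sqrt(np.maximum(sq, 0.0))  # clamp tiny negatives from rounding

# Naive version that materializes the (nx, ny, d) difference tensor.
naive = np.linalg.norm(x[:, None, :] - y[None, :, :], axis=-1)

print(np.allclose(fast, naive))  # → True
```

The `jnp.maximum(sq, 0.0)` clamp in the diff serves the same purpose as here: floating-point cancellation can make the squared distance slightly negative for near-identical points, and `sqrt` of a negative would produce NaN.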
