Add loop_over_posterior

lucianopaz · lucianopaz · commit 3012b1797109 · 2025-08-01T13:23:53.000+02:00
diff --git a/docs/source/api/samplers.rst b/docs/source/api/samplers.rst
@@ -15,6 +15,7 @@ This submodule contains functions for MCMC and forward sampling.
    draw
    compute_deterministics
    vectorize_over_posterior
+   loop_over_posterior
    init_nuts
    sampling.jax.sample_blackjax_nuts
    sampling.jax.sample_numpyro_nuts
diff --git a/pymc/sampling/forward.py b/pymc/sampling/forward.py
@@ -42,6 +42,7 @@
     walk,
 )
 from pytensor.graph.fg import FunctionGraph
+from pytensor.scan.basic import scan
 from pytensor.tensor.random.var import RandomGeneratorSharedVariable
 from pytensor.tensor.sharedvar import SharedVariable, TensorSharedVariable
 from pytensor.tensor.variable import TensorConstant, TensorVariable
@@ -57,7 +58,12 @@
 from pymc.distributions.shape_utils import change_dist_size
 from pymc.model import Model, modelcontext
 from pymc.progress_bar import CustomProgress, default_progress_theme
-from pymc.pytensorf import compile, rvs_in_graph
+from pymc.pytensorf import (
+    clone_while_sharing_some_variables,
+    collect_default_updates,
+    compile,
+    rvs_in_graph,
+)
 from pymc.util import (
     RandomState,
     _get_seeds_per_chain,
@@ -68,6 +74,7 @@
 __all__ = (
     "compile_forward_sampling_function",
     "draw",
+    "loop_over_posterior",
     "sample_posterior_predictive",
     "sample_prior_predictive",
     "vectorize_over_posterior",
@@ -1083,3 +1090,122 @@ def vectorize_over_posterior(
                 f"The following random variables found in the extracted graph: {remaining_rvs}"
             )
     return vectorized_outputs
+
+
+def loop_over_posterior(
+    outputs: list[Variable],
+    posterior: xr.Dataset,
+    input_rvs: list[Variable],
+    input_tensors: Sequence[Variable] = (),
+    allow_rvs_in_graph: bool = True,
+    sample_dims: tuple[str, ...] = ("chain", "draw"),
+) -> tuple[list[Variable], dict[Variable, Variable]]:
+    """Loop over posterior samples of subset of input rvs.
+
+    This function creates a new graph for the supplied outputs, where the required
+    subset of input rvs are replaced by their posterior samples (chain and draw
+    dimensions, or the dimensions provided in sample_dims are flattened). The other
+    input tensors are kept as is.
+
+    Parameters
+    ----------
+    outputs : list[Variable]
+        The list of variables to vectorize over the posterior samples.
+    posterior : xr.Dataset
+        The posterior samples to use as replacements for the `input_rvs`.
+    input_rvs : list[Variable]
+        The list of random variables to replace with their posterior samples.
+    input_tensors : Sequence[Variable]
+        The list of tensors to keep as is.
+    allow_rvs_in_graph : bool
+        Whether to allow random variables to be present in the graph. If False,
+        an error will be raised if any random variables are found in the graph. If
+        True, the remaining random variables will be resized to match the number of
+        draws from the posterior.
+    sample_dims : tuple[str, ...]
+        The dimensions of the posterior samples to use for looping the `input_rvs`.
+
+    Returns
+    -------
+    looped_outputs : list[Variable]
+        The looped variables, reshaped to match the original shape of the outputs, but
+        adding the sample_dims to the left.
+    updates : dict[Variable, Variable]
+        Dictionary of updates needed to compile the pytensor function to produce the
+        outputs.
+
+    Raises
+    ------
+    RuntimeError
+        If random variables are found in the graph and `allow_rvs_in_graph` is False
+    ValueError
+        If the supplied output tensors do not depend on the requested input tensors
+    """
+    if not (set(input_tensors) <= set(ancestors(outputs))):
+        raise ValueError(  # pragma: no cover
+            "The supplied output tensors do not depend on the following requested "
+            f"input tensors: {set(input_tensors) - set(ancestors(outputs))}"
+        )
+    outputs_ancestors = ancestors(outputs, blockers=input_rvs)
+    rvs_from_posterior: list[TensorVariable] = [
+        cast(TensorVariable, rv) for rv in outputs_ancestors if rv in set(input_rvs)
+    ]
+    independent_rvs = [
+        rv
+        for rv in rvs_in_graph(outputs)
+        if rv in outputs_ancestors and rv not in rvs_from_posterior
+    ]
+
+    def step(*args):
+        input_values = args[: len(args) - len(input_tensors) - len(independent_rvs)]
+        non_sequences = args[len(args) - len(input_tensors) - len(independent_rvs) :]
+
+        # Compute output sample value for input sample values
+        replace = {
+            **dict(zip(rvs_from_posterior, input_values, strict=True)),
+        }
+        samples = clone_while_sharing_some_variables(
+            outputs, replace=replace, kept_variables=non_sequences
+        )
+
+        # Collect updates if there are RV Ops in the graph
+        updates = collect_default_updates(outputs=samples, inputs=input_values)
+        return (*samples,), updates
+
+    sequences = []
+    batch_shape = tuple([len(posterior.coords[dim]) for dim in sample_dims])
+    nsamples = np.prod(batch_shape)
+    for rv in rvs_from_posterior:
+        values = posterior[rv.name].data
+        sequences.append(
+            pt.constant(
+                np.reshape(values, (nsamples, *values.shape[2:])),
+                name=rv.name,
+                dtype=rv.dtype,
+            )
+        )
+    scan_out, updates = scan(
+        fn=step,
+        sequences=sequences,
+        non_sequences=[*input_tensors, *independent_rvs],
+        n_steps=nsamples,
+    )
+    if len(outputs) == 1:
+        scan_out = [scan_out]  # pragma: no cover
+
+    looped: list[Variable] = []
+    for out in scan_out:
+        core_shape = tuple(
+            [
+                static if static is not None else dynamic
+                for static, dynamic in zip(out.type.shape[1:], out.shape[1:])
+            ]
+        )
+        looped.append(pt.reshape(out, (*batch_shape, *core_shape)))
+    if not allow_rvs_in_graph:
+        remaining_rvs = rvs_in_graph(looped)
+        if remaining_rvs:
+            raise RuntimeError(
+                f"The following random variables found in the extracted graph: {remaining_rvs}"
+            )
+    return looped, updates
diff --git a/tests/sampling/test_forward.py b/tests/sampling/test_forward.py
@@ -41,6 +41,7 @@
     compile_forward_sampling_function,
     get_constant_coords,
     get_vars_in_point_list,
+    loop_over_posterior,
     observed_dependent_deterministics,
     vectorize_over_posterior,
 )
@@ -1958,3 +1959,115 @@ def test_vectorize_over_posterior_matches_sample():
             atol=0.6 / np.sqrt(10000),
         )
         assert np.all(np.abs(vect_obs - x_posterior[..., None]) < 1)
+
+
+def test_loop_over_posterior(
+    variable_to_vectorize,
+    input_rv_names,
+    allow_rvs_in_graph,
+    model_to_vectorize,
+):
+    model, idata = model_to_vectorize
+
+    if not allow_rvs_in_graph and (len(input_rv_names) == 0 or "z" in variable_to_vectorize):
+        with pytest.raises(
+            RuntimeError,
+            match="The following random variables found in the extracted graph",
+        ):
+            loop_over_posterior(
+                outputs=[model[name] for name in variable_to_vectorize],
+                posterior=idata.posterior,
+                input_rvs=[model[name] for name in input_rv_names],
+                input_tensors=[model["d"]],
+                allow_rvs_in_graph=allow_rvs_in_graph,
+            )
+    else:
+        vectorized, _ = loop_over_posterior(
+            outputs=[model[name] for name in variable_to_vectorize],
+            posterior=idata.posterior,
+            input_rvs=[model[name] for name in input_rv_names],
+            input_tensors=[model["d"]],
+            allow_rvs_in_graph=allow_rvs_in_graph,
+        )
+        assert all(
+            vectorized_var is not model[name]
+            for vectorized_var, name in zip(vectorized, variable_to_vectorize)
+        )
+        assert all(vectorized_var.type.shape == (1, 100, 3) for vectorized_var in vectorized)
+        assert all(
+            variable_depends_on(
+                vectorized_var.owner.inputs[0].owner.op.inner_outputs[0], model["d"]
+            )
+            for vectorized_var in vectorized
+        )
+        inner_graph_outputs = [
+            vectorized_var.owner.inputs[0].owner.op.inner_outputs[i]
+            for i, vectorized_var in enumerate(vectorized)
+        ]
+        if len(vectorized) == 2:
+            assert variable_depends_on(
+                inner_graph_outputs[variable_to_vectorize.index("z_downstream")],
+                inner_graph_outputs[variable_to_vectorize.index("z")],
+            )
+        if len(input_rv_names) > 0:
+            for input_rv_name in input_rv_names:
+                if input_rv_name == "x_parent":
+                    assert len(get_var_by_name(inner_graph_outputs, input_rv_name)) == 0
+                else:
+                    [vectorized_rv] = get_var_by_name(vectorized, input_rv_name)
+                    rv_posterior = idata.posterior[input_rv_name].data
+                    assert isinstance(vectorized_rv, TensorConstant)
+                    np.testing.assert_equal(
+                        np.reshape(vectorized_rv.value, rv_posterior.shape),
+                        rv_posterior,
+                        strict=True,
+                    )
+        else:
+            original_rvs = rvs_in_graph([model[name] for name in variable_to_vectorize])
+            expected_rv_shapes = {rv.type.shape for rv in original_rvs}
+            rvs = rvs_in_graph(inner_graph_outputs)
+            assert {rv.type.shape for rv in rvs} == expected_rv_shapes
+
+
+def test_loop_over_posterior_matches_sample():
+    rng = np.random.default_rng(1234)
+    with pm.Model() as model:
+        x = pm.Normal("x")
+        sigma = 0.1
+        obs = pm.Normal("obs", x, sigma, observed=rng.normal(size=10))
+        det = pm.Deterministic("det", obs + 1)
+
+    chains = 2
+    draws = 100
+    x_posterior = np.broadcast_to(100 * np.arange(chains)[..., None], (chains, draws))
+    with model:
+        posterior = xr.Dataset(
+            {
+                "x": xr.DataArray(
+                    x_posterior,
+                    dims=("chain", "draw"),
+                    coords={"chain": np.arange(chains), "draw": np.arange(draws)},
+                )
+            }
+        )
+    idata = InferenceData(posterior=posterior)
+    with model:
+        pp = pm.sample_posterior_predictive(idata, var_names=["obs", "det"], random_seed=1234)
+        vectorized, updates = loop_over_posterior(
+            outputs=[obs, det],
+            posterior=posterior,
+            input_rvs=[x],
+            allow_rvs_in_graph=True,
+        )
+        [vect_obs, vect_det] = compile(
+            inputs=[], outputs=vectorized, random_seed=1234, updates=updates
+        )()
+        assert pp.posterior_predictive["obs"].shape == vect_obs.shape
+        assert pp.posterior_predictive["det"].shape == vect_det.shape
+        np.testing.assert_allclose(vect_obs + 1, vect_det)
+        np.testing.assert_allclose(
+            pp.posterior_predictive["obs"].mean(dim=("chain", "draw")),
+            vect_obs.mean(axis=(0, 1)),
+            atol=0.6 / np.sqrt(10000),
+        )
+        assert np.all(np.abs(vect_obs - x_posterior[..., None]) < 1)