adding some tests and a conclusion

NathanielF · NathanielF · commit d2035f86f73f · 2025-07-11T23:04:41.000+01:00
Signed-off-by: Nathaniel <NathanielF@users.noreply.github.com>
diff --git a/causalpy/pymc_models.py b/causalpy/pymc_models.py
@@ -527,6 +527,69 @@ def fit_outcome_model(
         normal_outcome=True,
         spline_component=False,
     ):
+        """
+        Fit a Bayesian outcome model using covariates and previously estimated propensity scores.
+
+        This function implements the second stage of a modular two-step causal inference procedure.
+        It uses propensity scores extracted from a prior treatment model (via `self.fit()`) to adjust
+        for confounding when estimating treatment effects on an outcome variable `y`.
+
+        Parameters
+        ----------
+        X_outcome : array-like, shape (n_samples, n_covariates)
+            Covariate matrix for the outcome model.
+
+        y : array-like, shape (n_samples,)
+            Observed outcome variable.
+
+        coords : dict
+            Coordinate dictionary for named dimensions in the PyMC model. Should include
+            a key "outcome_coeffs" for `X_outcome`.
+
+        priors : dict, optional
+            Dictionary specifying priors for outcome model parameters:
+                - "b_outcome": list [mean, std] for regression coefficients.
+                - "a_outcome": list [mean, std] for the intercept.
+                - "sigma": standard deviation of the outcome noise (default 1).
+
+        noncentred : bool, default True
+            If True, use a non-centred parameterization for the outcome coefficients.
+
+        normal_outcome : bool, default True
+            If True, assume a Normal likelihood for the outcome.
+            If False, use a Student-t likelihood with unknown degrees of freedom.
+
+        spline_component : bool, default False
+            If True, include a spline basis expansion on the propensity score to allow
+            flexible (nonlinear) adjustment. Uses B-splines with 30 internal knots.
+
+        Returns
+        -------
+        idata_outcome : arviz.InferenceData
+            The posterior and prior predictive samples from the outcome model.
+
+        model_outcome : pm.Model
+            The PyMC model object.
+
+        Raises
+        ------
+        AttributeError
+            If the `self.idata` attribute is not available, which indicates that
+            `fit()` (i.e., the treatment model) has not been called yet.
+
+        Notes
+        -----
+        - This model uses a sampled version of the propensity score (`p`) from the
+          posterior of the treatment model, randomly selecting one posterior draw
+          per call.
+        - The term `beta_ps[0] * p + beta_ps[1] * (p * treatment)` captures both
+          main and interaction effects of the propensity score.
+        - Including spline adjustment enables modeling nonlinear relationships
+          between the propensity score and the outcome.
+        - Compatible with IPW-style estimation when combined with a weighted
+          loss or diagnostics computed outside this function.
+
+        """
         if not hasattr(self, "idata"):
             raise AttributeError("""Object is missing required attribute 'idata'
                                  so cannot proceed. Call fit() first""")
@@ -551,7 +614,6 @@ def fit_outcome_model(
                     dims="outcome_coeffs",
                 )
 
-            beta_ps_spline = pm.Normal("beta_ps_spline", 0, 1, size=34)
             beta_ps = pm.Normal("beta_ps", 0, 1, size=2)
 
             chosen = np.random.choice(range(propensity_scores.shape[1]))
diff --git a/causalpy/tests/test_integration_pymc_examples.py b/causalpy/tests/test_integration_pymc_examples.py
@@ -14,6 +14,7 @@
 import arviz as az
 import numpy as np
 import pandas as pd
+import pymc as pm
 import pytest
 from matplotlib import pyplot as plt
 
@@ -723,5 +724,29 @@ def test_inverse_prop(mock_pymc_sample):
     assert isinstance(fig, plt.Figure)
     assert isinstance(axs, list)
     assert all(isinstance(ax, plt.Axes) for ax in axs)
+    plt.close()
     with pytest.raises(NotImplementedError):
         result.get_plot_data()
+
+    # Test outcome model
+    idata_normal, model_normal = result.model.fit_outcome_model(
+        X_outcome=result.X_outcome,
+        y=result.y,
+        coords=result.coords,
+        normal_outcome=True,
+        spline_component=False,
+    )
+    assert isinstance(idata_normal, az.InferenceData)
+    assert isinstance(model_normal, pm.Model)
+    assert "beta_" in idata_normal.posterior
+    assert "beta_ps" in idata_normal.posterior
+
+    # Test spline model
+    idata_spline, _ = result.model.fit_outcome_model(
+        X_outcome=result.X_outcome,
+        y=result.y,
+        coords=result.coords,
+        normal_outcome=True,
+        spline_component=True,
+    )
+    assert "spline_features" in idata_spline.posterior
diff --git a/docs/source/_static/interrogate_badge.svg b/docs/source/_static/interrogate_badge.svg
@@ -1,5 +1,5 @@
 <svg width="140" height="20" viewBox="0 0 140 20" version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" xmlns:serif="http://www.serif.com/" style="fill-rule:evenodd;clip-rule:evenodd;stroke-linejoin:round;stroke-miterlimit:2;">
-    <title>interrogate: 94.5%</title>
+    <title>interrogate: 95.0%</title>
     <g transform="matrix(1,0,0,1,22,0)">
         <g id="backgrounds" transform="matrix(1.32789,0,0,1,-22.3892,0)">
             <rect x="0" y="0" width="71" height="20" style="fill:rgb(85,85,85);"/>
@@ -12,8 +12,8 @@
     <g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110">
         <text x="590" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="610">interrogate</text>
         <text x="590" y="140" transform="scale(.1)" textLength="610">interrogate</text>
-        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">94.5%</text>
-        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">94.5%</text>
+        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.0%</text>
+        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.0%</text>
     </g>
     <g id="logo-shadow" serif:id="logo shadow" transform="matrix(0.854876,0,0,0.854876,-6.73514,1.732)">
         <g transform="matrix(0.299012,0,0,0.299012,9.70229,-6.68582)">