Use Prior objects from pymc-experimental for the cp_effect_param priors

JeanVanDyk · JeanVanDyk · commit b9c3a976f616 · 2025-10-23T17:14:17.000+02:00
diff --git a/causalpy/experiments/change_point_detection.py b/causalpy/experiments/change_point_detection.py
@@ -312,14 +312,14 @@ def _bayesian_plot(
         # Plot predicted values after change point (with HDI)
         h_line, h_patch = plot_xY(
             self.datapre.index,
-            self.pre_pred["posterior_predictive"].mu_ts.isel(treated_units=0),
+            self.pre_pred["posterior_predictive"].mu.isel(treated_units=0),
             ax=ax[0],
             plot_hdi_kwargs={"color": "yellowgreen"},
         )
 
         h_line, h_patch = plot_xY(
             self.datapost.index,
-            self.post_pred["posterior_predictive"].mu_ts.isel(treated_units=0),
+            self.post_pred["posterior_predictive"].mu.isel(treated_units=0),
             ax=ax[0],
             plot_hdi_kwargs={"color": "yellowgreen"},
         )
@@ -330,7 +330,7 @@ def _bayesian_plot(
         # pre-intervention period
         h_line, h_patch = plot_xY(
             self.datapre.index,
-            self.pre_pred["posterior_predictive"].mu.isel(treated_units=0),
+            self.pre_pred["posterior_predictive"].mu_ts.isel(treated_units=0),
             ax=ax[0],
             plot_hdi_kwargs={"color": "C0"},
         )
@@ -351,7 +351,7 @@ def _bayesian_plot(
         # post intervention period
         h_line, h_patch = plot_xY(
             self.datapost.index,
-            self.post_pred["posterior_predictive"].mu.isel(treated_units=0),
+            self.post_pred["posterior_predictive"].mu_ts.isel(treated_units=0),
             ax=ax[0],
             plot_hdi_kwargs={"color": "C1"},
         )
@@ -367,7 +367,7 @@ def _bayesian_plot(
         )
         # Shaded causal effect
         post_pred_mu = (
-            az.extract(self.post_pred, group="posterior_predictive", var_names="mu")
+            az.extract(self.post_pred, group="posterior_predictive", var_names="mu_ts")
             .isel(treated_units=0)
             .mean("sample")
         )  # Add .mean("sample") to get 1D array
diff --git a/causalpy/pymc_models.py b/causalpy/pymc_models.py
@@ -890,7 +890,7 @@ class initialisation.
 
 class LinearChangePointDetection(PyMCModel):
     r"""
-    Custom PyMC model to estimate the time an intervention took place.
+    Custom PyMC model to estimate a single change point in a time series.
 
     This model implements three types of changepoints: level shift, trend change, and impulse response.
     While the underlying mathematical framework could theoretically be applied to other changepoint
@@ -965,6 +965,14 @@ class LinearChangePointDetection(PyMCModel):
         Inference ...
     """
 
+    default_priors = {
+        "beta": Prior("Normal", mu=0, sigma=5, dims=["treated_units", "coeffs"]),
+        "level": Prior("Normal", mu=0, sigma=5),
+        "trend": Prior("Normal", mu=0, sigma=0.5),
+        "impulse_amplitude": Prior("Normal", mu=0, sigma=5),
+        "impulse_decay_rate": Prior("HalfNormal", sigma=5),
+    }
+
     def __init__(
         self,
         cp_effect_type: str | list[str],
@@ -984,50 +992,14 @@ def __init__(
         :param sample_kwargs: Optional dictionary of arguments passed to pm.sample().
         """
 
-        super().__init__(sample_kwargs)
-
-        # Hardcoded default priors
-        self.DEFAULT_BETA_PRIOR = (0, 5)
-        self.DEFAULT_LEVEL_PRIOR = (0, 5)
-        self.DEFAULT_TREND_PRIOR = (0, 0.5)
-        self.DEFAULT_IMPULSE_PRIOR = (0, 5, 5)
+        super().__init__(sample_kwargs, cp_effect_param)
 
         # Make sure we get a list of all expected effects
         if isinstance(cp_effect_type, str):
             self.cp_effect_type = [cp_effect_type]
         else:
             self.cp_effect_type = cp_effect_type
 
-        # Defining the priors here
-        self.cp_effect_param = {} if cp_effect_param is None else cp_effect_param
-
-        if "level" in self.cp_effect_type:
-            if (
-                "level" not in self.cp_effect_param
-                or len(self.cp_effect_param["level"]) != 2
-            ):
-                self.cp_effect_param["level"] = self.DEFAULT_LEVEL_PRIOR
-            else:
-                self.cp_effect_param["level"] = self.cp_effect_param["level"]
-
-        if "trend" in self.cp_effect_type:
-            if (
-                "trend" not in self.cp_effect_param
-                or len(self.cp_effect_param["trend"]) != 2
-            ):
-                self.cp_effect_param["trend"] = self.DEFAULT_TREND_PRIOR
-            else:
-                self.cp_effect_param["trend"] = self.cp_effect_param["trend"]
-
-        if "impulse" in self.cp_effect_type:
-            if (
-                "impulse" not in self.cp_effect_param
-                or len(self.cp_effect_param["impulse"]) != 3
-            ):
-                self.cp_effect_param["impulse"] = self.DEFAULT_IMPULSE_PRIOR
-            else:
-                self.cp_effect_param["impulse"] = self.cp_effect_param["impulse"]
-
     def build_model(self, X, y, coords):
         """
         Defines the PyMC model
@@ -1061,39 +1033,25 @@ def build_model(self, X, y, coords):
                 var=(t - change_point),
                 dims=["obs_ind"],
             )
-            beta = pm.Normal(
-                name="beta",
-                mu=self.DEFAULT_BETA_PRIOR[0],
-                sigma=self.DEFAULT_BETA_PRIOR[1],
-                dims=["treated_units", "coeffs"],
-            )
+            beta = self.priors["beta"].create_variable("beta")
 
             # --- Intervention effect ---
             mu_in_components = []
 
-            if "level" in self.cp_effect_param:
-                level = pm.Normal(
-                    "level",
-                    mu=self.cp_effect_param["level"][0],
-                    sigma=self.cp_effect_param["level"][1],
-                )
+            if "level" in self.cp_effect_type:
+                level = self.priors["level"].create_variable("level")
                 mu_in_components.append(level)
-            if "trend" in self.cp_effect_param:
-                trend = pm.Normal(
-                    "trend",
-                    mu=self.cp_effect_param["trend"][0],
-                    sigma=self.cp_effect_param["trend"][1],
-                )
+
+            if "trend" in self.cp_effect_type:
+                trend = self.priors["trend"].create_variable("trend")
                 mu_in_components.append(trend * delta_t)
-            if "impulse" in self.cp_effect_param:
-                impulse_amplitude = pm.Normal(
-                    "impulse_amplitude",
-                    mu=self.cp_effect_param["impulse"][0],
-                    sigma=self.cp_effect_param["impulse"][1],
+
+            if "impulse" in self.cp_effect_type:
+                impulse_amplitude = self.priors["impulse_amplitude"].create_variable(
+                    "impulse_amplitude"
                 )
-                decay_rate = pm.HalfNormal(
-                    "decay_rate",
-                    sigma=self.cp_effect_param["impulse"][2],
+                decay_rate = self.priors["impulse_decay_rate"].create_variable(
+                    "impulse_decay_rate"
                 )
                 impulse = pm.Deterministic(
                     "impulse",
@@ -1104,8 +1062,8 @@ def build_model(self, X, y, coords):
             # --- Parameterization ---
             weight = pm.math.sigmoid(delta_t)
             # Compute and store the base time series
-            mu = pm.Deterministic(
-                name="mu", var=pm.math.dot(X, beta.T), dims=["obs_ind", "treated_units"]
+            mu_ts = pm.Deterministic(
+                name="mu_ts", var=pt.dot(X, beta.T), dims=["obs_ind", "treated_units"]
             )
             # Compute and store the modelled intervention effect
             mu_in = (
@@ -1120,20 +1078,20 @@ def build_model(self, X, y, coords):
                 )
             )
             # Compute and store the sum of the base time series and the intervention's effect
-            mu_ts = pm.Deterministic(
-                "mu_ts",
-                mu + (weight * mu_in)[:, None],
+            mu = pm.Deterministic(
+                "mu",
+                mu_ts + (weight * mu_in)[:, None],
                 dims=["obs_ind", "treated_units"],
             )
-            sigma = pm.HalfNormal("sigma", 1, dims="treated_units")
 
             # --- Likelihood ---
+            sigma = pm.HalfNormal("sigma", 1, dims="treated_units")
             # Likelihood of the base time series
-            pm.Normal("y_hat", mu=mu, sigma=sigma, dims=["obs_ind", "treated_units"])
+            pm.Normal("y_ts", mu=mu_ts, sigma=sigma, dims=["obs_ind", "treated_units"])
             # Likelihodd of the base time series and the intervention's effect
             pm.Normal(
-                "y_ts",
-                mu=mu_ts,
+                "y_hat",
+                mu=mu,
                 sigma=sigma,
                 observed=y,
                 dims=["obs_ind", "treated_units"],
@@ -1193,8 +1151,8 @@ def score(self, X, y) -> pd.Series:
         """
         Score the Bayesian :math:`R^2` given inputs ``X`` and outputs ``y``.
         """
-        mu_ts = self.predict(X)
-        mu_data = az.extract(mu_ts, group="posterior_predictive", var_names="mu_ts")
+        mu = self.predict(X)
+        mu_data = az.extract(mu, group="posterior_predictive", var_names="mu")
 
         scores = {}
 
@@ -1208,6 +1166,12 @@ def score(self, X, y) -> pd.Series:
 
         return pd.Series(scores)
 
+    def calculate_impact(
+        self, y_true: xr.DataArray, y_pred: az.InferenceData
+    ) -> xr.DataArray:
+        impact = y_true - y_pred["posterior_predictive"]["y_ts"]
+        return impact.transpose(..., "obs_ind")
+
     def set_time_range(self, time_range, data):
         """
         Set time_range.
diff --git a/docs/source/_static/interrogate_badge.svg b/docs/source/_static/interrogate_badge.svg
@@ -1,5 +1,5 @@
 <svg width="140" height="20" viewBox="0 0 140 20" version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" xmlns:serif="http://www.serif.com/" style="fill-rule:evenodd;clip-rule:evenodd;stroke-linejoin:round;stroke-miterlimit:2;">
-    <title>interrogate: 96.0%</title>
+    <title>interrogate: 95.7%</title>
     <g transform="matrix(1,0,0,1,22,0)">
         <g id="backgrounds" transform="matrix(1.32789,0,0,1,-22.3892,0)">
             <rect x="0" y="0" width="71" height="20" style="fill:rgb(85,85,85);"/>
@@ -12,8 +12,8 @@
     <g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110">
         <text x="590" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="610">interrogate</text>
         <text x="590" y="140" transform="scale(.1)" textLength="610">interrogate</text>
-        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">96.0%</text>
-        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">96.0%</text>
+        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.7%</text>
+        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.7%</text>
     </g>
     <g id="logo-shadow" serif:id="logo shadow" transform="matrix(0.854876,0,0,0.854876,-6.73514,1.732)">
         <g transform="matrix(0.299012,0,0,0.299012,9.70229,-6.68582)">
diff --git a/docs/source/notebooks/cp_covid.ipynb b/docs/source/notebooks/cp_covid.ipynb