stochastic sampler

arrjon · arrjon · commit 9ed482defe3e · 2025-04-24T23:55:03.000+02:00
diff --git a/bayesflow/experimental/diffusion_model.py b/bayesflow/experimental/diffusion_model.py
@@ -374,7 +374,7 @@ class DiffusionModel(InferenceNetwork):
     }
 
     INTEGRATE_DEFAULT_CONFIG = {
-        "method": "euler",
+        "method": "euler",  # or "euler_maruyama" (SDE; inverse sampling only, no density)
         "steps": 100,
     }
 
@@ -530,6 +530,7 @@ def velocity(
         time: float | Tensor,
         conditions: Tensor = None,
         training: bool = False,
+        stochastic_solver: bool = False,
         clip_x: bool = False,
     ) -> Tensor:
         # calculate the current noise level and transform into correct shape
@@ -549,44 +550,28 @@ def velocity(
         # convert x to score
         score = (alpha_t * x_pred - xz) / ops.square(sigma_t)
 
-        # compute velocity for the ODE depending on the noise schedule
+        # compute drift f and squared diffusion g^2 of the SDE or ODE
         f, g_squared = self.noise_schedule.get_drift_diffusion(log_snr_t=log_snr_t, x=xz)
-        # out = f - 0.5 * g_squared * score
-        out = f - g_squared * score
 
-        # todo: for the SDE: d(z) = [ f(z, t) - g(t)^2 * score(z, lambda) ] dt + g(t) dW
+        if stochastic_solver:
+            # for the reverse SDE: dz = [f(z, t) - g(t)^2 * score(z, lambda)] dt + g(t) dW
+            out = f - g_squared * score
+        else:
+            # for the probability-flow ODE: dz = [f(z, t) - 0.5 * g(t)^2 * score(z, lambda)] dt
+            out = f - 0.5 * g_squared * score
+
         return out
 
-    def velocity2(
+    def compute_diffusion_term(
         self,
         xz: Tensor,
         time: float | Tensor,
-        conditions: Tensor = None,
         training: bool = False,
-        clip_x: bool = False,
     ) -> Tensor:
         # calculate the current noise level and transform into correct shape
         log_snr_t = expand_right_as(self.noise_schedule.get_log_snr(t=time, training=training), xz)
         log_snr_t = keras.ops.broadcast_to(log_snr_t, keras.ops.shape(xz)[:-1] + (1,))
-        # alpha_t, sigma_t = self.noise_schedule.get_alpha_sigma(log_snr_t=log_snr_t, training=training)
-
-        # if conditions is None:
-        #    xtc = keras.ops.concatenate([xz, log_snr_t], axis=-1)
-        # else:
-        #    xtc = keras.ops.concatenate([xz, log_snr_t, conditions], axis=-1)
-        # pred = self.output_projector(self.subnet(xtc, training=training), training=training)
-
-        # x_pred = self.convert_prediction_to_x(
-        #    pred=pred, z=xz, alpha_t=alpha_t, sigma_t=sigma_t, log_snr_t=log_snr_t, clip_x=clip_x
-        # )
-        # convert x to score
-        # score = (alpha_t * x_pred - xz) / ops.square(sigma_t)
-
-        # compute velocity for the ODE depending on the noise schedule
-        f, g_squared = self.noise_schedule.get_drift_diffusion(log_snr_t=log_snr_t, x=xz)
-        # out = f - 0.5 * g_squared * score
-        # out = f - g_squared * score
-
+        g_squared = self.noise_schedule.get_drift_diffusion(log_snr_t=log_snr_t)
         return ops.sqrt(g_squared)
 
     def _velocity_trace(
@@ -620,6 +605,9 @@ def _forward(
             | self.integrate_kwargs
             | kwargs
         )
+        if integrate_kwargs["method"] == "euler_maruyama":
+            raise ValueError("Stochastic methods are not supported for forward integration.")
+
         if density:
 
             def deltas(time, xz):
@@ -670,6 +658,8 @@ def _inverse(
             | kwargs
         )
         if density:
+            if integrate_kwargs["method"] == "euler_maruyama":
+                raise ValueError("Stochastic methods are not supported for density computation.")
 
             def deltas(time, xz):
                 v, trace = self._velocity_trace(xz, time=time, conditions=conditions, training=training)
@@ -689,21 +679,33 @@ def deltas(time, xz):
         def deltas(time, xz):
             return {"xz": self.velocity(xz, time=time, conditions=conditions, training=training)}
 
-        def diffusion(time, xz):
-            return {"xz": self.velocity2(xz, time=time, conditions=conditions, training=training)}
-
         state = {"xz": z}
-        # state = integrate(
-        #    deltas,
-        #    state,
-        #    **integrate_kwargs,
-        # )
-        state = integrate_stochastic(
-            deltas,
-            diffusion,
-            state,
-            **integrate_kwargs,
-        )
+        if integrate_kwargs["method"] == "euler_maruyama":
+
+            def sde_drift(time, xz):
+                # Euler-Maruyama integrates the reverse SDE, whose drift is f - g^2 * score;
+                # velocity() only builds that form when stochastic_solver=True (its default
+                # gives the ODE drift f - 0.5 * g^2 * score, which must not be paired with noise).
+                drift = self.velocity(
+                    xz, time=time, conditions=conditions, training=training, stochastic_solver=True
+                )
+                return {"xz": drift}
+
+            def diffusion(time, xz):
+                return {"xz": self.compute_diffusion_term(xz, time=time, training=training)}
+
+            state = integrate_stochastic(
+                sde_drift,
+                diffusion,
+                state,
+                **integrate_kwargs,
+            )
+        else:
+            state = integrate(
+                deltas,
+                state,
+                **integrate_kwargs,
+            )
 
         x = state["xz"]
         return x