Implement first-order and second-order TPS; update baseline for second order

plainerman · plainerman · commit 9d95064b4758 · 2024-05-07T15:12:16.000+02:00
diff --git a/environment.yml b/environment.yml
@@ -17,3 +17,4 @@ dependencies:
     - matplotlib==3.8.2
     - rdkit==2023.3.3
     - ParmEd==4.2.2
+    - scikit-image==0.23.2
diff --git a/tps/first_order.py b/tps/first_order.py
@@ -5,7 +5,7 @@
 MAX_STEPS = 1_000
 
 
-class System:
+class FirstOrderSystem:
     def __init__(self, start_state, target_state, step):
         self.start_state = start_state
         self.target_state = target_state
@@ -18,7 +18,7 @@ def one_way_shooting(system, trajectory, fixed_length, key):
     # pick a random point along the trajectory
     point_idx = jax.random.randint(key[0], (1,), 1, len(trajectory) - 1)[0]
     # pick a random direction, either forward or backward
-    direction = jax.random.randint(key[1], (1,), 0,  2)[0]
+    direction = jax.random.randint(key[1], (1,), 0, 2)[0]
 
     if direction == 0:
         trajectory = trajectory[:point_idx + 1]
diff --git a/tps/plot.py b/tps/plot.py
@@ -0,0 +1,106 @@
+import numpy as np
+from skimage.draw import line
+from tqdm import tqdm
+import matplotlib.pyplot as plt
+
+
+class PeriodicPathHistogram:
+    """2D histogram (bins x bins) of paths living on the periodic square [-scale, scale] x [-scale, scale]."""
+
+    def __init__(self, bins=250, interpolate=True, scale=np.pi):
+        self.bins = bins
+        self.interpolate = interpolate  # rasterize the segments between frames, not only the frames
+        self.scale = scale
+        self.hist = np.zeros((bins, bins))
+
+    def add_paths(self, paths: list[np.ndarray], factors: list[float] = None):
+        """Add every path, weighted by the matching entry of `factors` (weight 1 for all paths if omitted)."""
+        for path, factor in tqdm(zip(paths, factors or [1] * len(paths)), total=len(paths)):
+            self.add_path(path, factor=factor)
+
+    def add_path(self, path: np.ndarray, factor: float = 1):
+        """
+        Adds a path to the histogram. The path is a list of 2D points in the range [-scale, scale].
+        Every bin that the path touches is incremented by `factor` exactly once.
+        """
+        # index chunks are gathered in lists and joined once, which keeps long paths linear in time
+        rows, cols = [np.array([], dtype=int)], [np.array([], dtype=int)]
+
+        if self.interpolate:
+            for i in range(len(path) - 1):
+                rr_cur, cc_cur = self._add_path_segment_periodic(path[i], path[i + 1])
+                rows.append(rr_cur)
+                cols.append(cc_cur)
+        elif len(path) > 0:
+            points = self._to_bins(np.asarray(path))
+            cols.append(points[:, 0])
+            rows.append(points[:, 1])
+
+        rr, cc = np.concatenate(rows), np.concatenate(cols)
+        # we only add it once for each path, so that overlapping segments are not counted multiple times
+        self.hist[rr, cc] += factor
+
+    def _to_bins(self, points: np.ndarray):
+        """Map coordinates in [-scale, scale] to integer bin indices in [0, bins - 1]."""
+        return ((points + self.scale) / (2 * self.scale) * (self.bins - 1)).astype(int)
+
+    def _add_path_segment_periodic(self, start: np.ndarray, stop: np.ndarray):
+        """Rasterize one segment; a jump of at least `scale` is drawn towards the nearest periodic images."""
+        start, stop = np.array(start), np.array(stop)
+
+        if np.linalg.norm(start - stop) < self.scale:
+            return self._determine_path_segments(start, stop)
+
+        s = 2 * self.scale  # one full period; the order below decides ties in argmin, so keep it
+        possible_offsets = [np.array(o) for o in
+                            ((0, s), (0, -s), (s, 0), (-s, 0), (s, s), (-s, s), (s, -s), (-s, -s))]
+
+        def add_shortest_segment(point, target):
+            distances = np.array([np.linalg.norm((target + offset) - point) for offset in possible_offsets])
+            best_offset_idx = np.argmin(distances)
+
+            best_target = target + possible_offsets[best_offset_idx]
+            return self._determine_path_segments(point, best_target)
+
+        # just try each possible combination and use the shortest path
+        rr1, cc1 = add_shortest_segment(start, stop)
+        rr2, cc2 = add_shortest_segment(stop, start)
+        return np.concatenate([rr1, rr2]), np.concatenate([cc1, cc2])
+
+    def _determine_path_segments(self, start: np.ndarray, stop: np.ndarray):
+        """
+        Start and stop are 2D points in the range [-scale, scale].
+        This function converts the points into the corresponding bins and then uses a line to connect those points
+        """
+        start = self._to_bins(start)
+        stop = self._to_bins(stop)
+
+        rr, cc = line(start[1], start[0], stop[1], stop[0])
+        # shifted (periodic) end points fall outside the grid, so only the in-grid part of the line is kept
+        mask = (rr >= 0) & (rr < self.bins) & (cc >= 0) & (cc < self.bins)
+        return rr[mask], cc[mask]
+
+    def plot(self, density=False, cmin=None, cmax=None, **kwargs):
+        """Draw the histogram with `plt.pcolormesh`; bins below `cmin` or above `cmax` are set to NaN first."""
+        H = self.hist.copy()
+        if density:
+            H /= H.sum() * (2 * self.scale / self.bins) ** 2
+
+        if cmin is not None:
+            H[H < cmin] = None
+        if cmax is not None:
+            H[H > cmax] = None
+
+        x = np.linspace(self.scale, -self.scale, self.bins)
+        y = np.linspace(self.scale, -self.scale, self.bins)
+        xv, yv = np.meshgrid(x, y)
+
+        plt.pcolormesh(xv, yv, np.flip(H), **kwargs)
+        ticks = np.arange(-self.scale, self.scale + self.scale * 0.01, self.scale / 4)
+
+        plt.xlim(-self.scale, self.scale)
+        plt.ylim(-self.scale, self.scale)
+        plt.xlabel(r"$\phi$")
+        plt.ylabel(r"$\psi$")
+        plt.xticks(ticks)
+        plt.yticks(ticks)
diff --git a/tps/second_order.py b/tps/second_order.py
@@ -0,0 +1,191 @@
+import jax
+import jax.numpy as jnp
+from tqdm import tqdm
+
+MAX_STEPS = 2_000  # frame cap for a proposed path when no fixed_length is requested
+MAX_ABS_VALUE = 5  # a shooting proposal is rejected once any coordinate exceeds this magnitude
+
+
+class SecondOrderSystem:
+    """Bundle of state predicates, velocity-aware integrator steps and a velocity sampler used by the samplers."""
+    def __init__(self, start_state, target_state, step_forward, step_backward, sample_velocity):
+        self.start_state, self.target_state = start_state, target_state  # called as predicate(point) -> truthy
+        # the steps are called as step(point, velocity, key) -> (point, velocity); the sampler as sample(key)
+        self.step_forward, self.step_backward = step_forward, step_backward
+        self.sample_velocity = sample_velocity
+
+
+def one_way_shooting(system, trajectory, fixed_length, key):
+    """Propose a new path by regrowing `trajectory` forward or backward from a random interior frame.
+
+    Returns `(found, path)`; `found` requires start -> target and, if non-zero, exactly `fixed_length` frames."""
+    key = jax.random.split(key, 3)  # three independent keys: shooting point, direction, integrator noise
+
+    # pick a random point along the trajectory
+    point_idx = jax.random.randint(key[0], (1,), 1, len(trajectory) - 1)[0]
+    # pick a random direction, either forward or backward
+    direction = jax.random.randint(key[1], (1,), 0, 2)[0]
+
+    # TODO: Fix correct dt in ps
+    velocity = (trajectory[point_idx] - trajectory[point_idx - 1]) / 0.001
+
+    if direction == 0:
+        trajectory = trajectory[:point_idx + 1]
+        step_function = system.step_forward
+    else:  # direction == 1:
+        trajectory = trajectory[point_idx:][::-1]
+        step_function = system.step_backward
+
+    steps = MAX_STEPS if fixed_length == 0 else fixed_length
+
+    key, iter_key = jax.random.split(key[2])
+    while len(trajectory) < steps:
+        key, iter_key = jax.random.split(key)
+        point, velocity = step_function(trajectory[-1], velocity, iter_key)
+        trajectory.append(point)
+
+        # give up on NaNs, and ensure that our trajectory does not explode
+        if jnp.isnan(point).any() or jnp.isnan(velocity).any() or (jnp.abs(point) > MAX_ABS_VALUE).any():
+            return False, trajectory
+
+        if system.start_state(trajectory[0]) and system.target_state(trajectory[-1]):
+            if fixed_length == 0 or len(trajectory) == fixed_length:
+                return True, trajectory
+            return False, trajectory
+
+        if system.target_state(trajectory[0]) and system.start_state(trajectory[-1]):
+            if fixed_length == 0 or len(trajectory) == fixed_length:
+                return True, trajectory[::-1]
+            return False, trajectory
+
+    return False, trajectory
+
+
+def two_way_shooting(system, trajectory, fixed_length, key):
+    """Propose a new path by shooting forward and then backward from a random interior frame.
+
+    One velocity drawn from `system.sample_velocity` seeds both directions.
+    Returns `(True, path)` with `path` running from the start state to the target state, or
+    `(False, trajectory)` (the unchanged input) when no valid path was produced."""
+    key = jax.random.split(key, 3)  # three independent keys: shooting point, velocity, integrator noise
+
+    # pick a random point along the trajectory
+    point_idx = jax.random.randint(key[0], (1,), 1, len(trajectory) - 1)[0]
+    point = trajectory[point_idx]
+
+    steps = MAX_STEPS if fixed_length == 0 else fixed_length
+
+    initial_velocity = system.sample_velocity(key[1])
+
+    key, iter_key = jax.random.split(key[2])
+    new_trajectory = [point]
+
+    # simulate forward from the point until a state is reached or the step budget is used up
+    velocity = initial_velocity
+    while len(new_trajectory) < steps:
+        key, iter_key = jax.random.split(key)
+        point, velocity = system.step_forward(new_trajectory[-1], velocity, iter_key)
+        new_trajectory.append(point)
+
+        # give up on NaNs, and ensure that our trajectory does not explode
+        if jnp.isnan(point).any() or jnp.isnan(velocity).any() or (jnp.abs(point) > MAX_ABS_VALUE).any():
+            return False, trajectory
+
+        if system.start_state(point) or system.target_state(point):
+            break
+
+    # then extend backward from the same point with whatever is left of the step budget
+    velocity = initial_velocity
+    while len(new_trajectory) < steps:
+        key, iter_key = jax.random.split(key)
+        point, velocity = system.step_backward(new_trajectory[0], velocity, iter_key)
+        new_trajectory.insert(0, point)
+
+        # give up on NaNs, and ensure that our trajectory does not explode
+        if jnp.isnan(point).any() or jnp.isnan(velocity).any() or (jnp.abs(point) > MAX_ABS_VALUE).any():
+            return False, trajectory
+
+        if system.start_state(point) or system.target_state(point):
+            break
+
+    # throw away the trajectory if it's not the right length
+    if fixed_length != 0 and len(new_trajectory) != fixed_length:
+        return False, trajectory
+
+    if system.start_state(new_trajectory[0]) and system.target_state(new_trajectory[-1]):
+        return True, new_trajectory
+
+    if system.target_state(new_trajectory[0]) and system.start_state(new_trajectory[-1]):
+        return True, new_trajectory[::-1]
+
+    return False, trajectory
+
+
+def mcmc_shooting(system, proposal, initial_trajectory, num_paths, key, fixed_length=0, warmup=50):
+    """Collect `num_paths` paths via `proposal`; the initial path and the first `warmup` accepted ones are dropped."""
+    trajectories = [initial_trajectory]
+
+    with tqdm(total=num_paths + warmup, desc='warming up' if warmup > 0 else '') as pbar:
+        while len(trajectories) <= num_paths + warmup:
+            if len(trajectories) > warmup:
+                pbar.set_description('')
+
+            key, traj_idx_key, iter_key, accept_key = jax.random.split(key, 4)
+            traj_idx = jax.random.randint(traj_idx_key, (1,), warmup + 1, len(trajectories))[0]
+            # during warmup, we want an iterative scheme (NOTE(review): minval > maxval then — confirm randint's result)
+            traj_idx = traj_idx if traj_idx < len(trajectories) else -1
+
+            found, new_trajectory = proposal(system, trajectories[traj_idx], fixed_length, iter_key)
+
+            if not found:
+                continue
+
+            ratio = len(trajectories[-1]) / len(new_trajectory)  # NOTE(review): latest path, not trajectories[traj_idx] — confirm
+            # The first trajectory might have a very unreasonable length, so we skip it
+            if len(trajectories) == 1 or jax.random.uniform(accept_key, shape=(1,)) < ratio:
+                trajectories.append(new_trajectory)
+                pbar.update(1)
+
+    return trajectories[warmup + 1:]
+
+
+def unguided_md(system, initial_point, num_paths, key, fixed_length=0):
+    """Run plain forward dynamics from `initial_point` until `num_paths` start-to-target paths were observed."""
+    trajectories = []
+    current_frame = initial_point.clone()
+    current_trajectory = []  # frames of the candidate path currently being recorded
+    key, velocity_key = jax.random.split(key)
+    velocity = system.sample_velocity(velocity_key)
+
+    with tqdm(total=num_paths) as pbar:
+        while len(trajectories) < num_paths:
+            key, iter_key = jax.random.split(key)
+            next_frame, velocity = system.step_forward(current_frame, velocity, iter_key)
+
+            assert not jnp.isnan(next_frame).any()
+
+            is_transition = not (system.start_state(next_frame) or system.target_state(next_frame))  # in neither state
+            if is_transition:
+                if len(current_trajectory) == 0:
+                    current_trajectory.append(current_frame)  # keep the frame the excursion started from
+
+                if fixed_length != 0 and len(current_trajectory) > fixed_length:
+                    current_trajectory = []  # too long for the requested fixed length: discard
+                    is_transition = False  # NOTE(review): not read again before being reassigned
+                else:
+                    current_trajectory.append(next_frame)
+            elif len(current_trajectory) > 0:
+                current_trajectory.append(next_frame)  # the frame that landed inside a state closes the candidate
+
+                if fixed_length == 0 or len(current_trajectory) == fixed_length:
+                    if system.start_state(current_trajectory[0]) and system.target_state(current_trajectory[-1]):
+                        trajectories.append(current_trajectory)
+                        pbar.update(1)
+                    elif system.target_state(current_trajectory[0]) and system.start_state(current_trajectory[-1]):
+                        trajectories.append(current_trajectory[::-1])  # stored in start -> target order
+                        pbar.update(1)
+                current_trajectory = []
+
+            current_frame = next_frame
+
+    return trajectories
diff --git a/tps_baseline.py b/tps_baseline.py
diff --git a/utils/animation.py b/utils/animation.py