MurrellGroup
diff --git a/‎Project.toml‎
Lines changed: 14 additions & 0 deletions b/‎Project.toml‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎examples/Project.toml‎
Lines changed: 9 additions & 0 deletions b/‎examples/Project.toml‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎examples/continuous.jl‎
Lines changed: 90 additions & 0 deletions b/‎examples/continuous.jl‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎examples/continuous_cat_BrownianMotion{Float32}(0.0f0, 0.1f0).svg‎
Lines changed: 15072 additions & 0 deletions b/‎examples/continuous_cat_BrownianMotion{Float32}(0.0f0, 0.1f0).svg‎
Lines changed: 15072 additions & 0 deletions
diff --git a/‎examples/continuous_cat_Deterministic().svg‎
Lines changed: 15070 additions & 0 deletions b/‎examples/continuous_cat_Deterministic().svg‎
Lines changed: 15070 additions & 0 deletions
diff --git a/‎src/Flowfusion.jl‎
Lines changed: 27 additions & 1 deletion b/‎src/Flowfusion.jl‎
Lines changed: 27 additions & 1 deletion
diff --git a/‎src/bridge.jl‎
Lines changed: 156 additions & 0 deletions b/‎src/bridge.jl‎
Lines changed: 156 additions & 0 deletions
@@ -3,7 +3,21 @@ uuid = "5b4e93c8-7b6e-4682-b400-fc3b238f52b1"
 authors = ["murrellb <[email protected]> and contributors"]
 version = "1.0.0-DEV"
 
+[deps]
+Adapt = "79e6a3ab-5dfb-504d-930d-738a2a938a0e"
+ForwardBackward = "e879419d-bb0f-4252-adee-d266c51ac92d"
+Manifolds = "1cead3c2-87b3-11e9-0ccd-23c62b72b94e"
+NNlib = "872c559c-99b0-510c-b3b7-b6c96a88d5cd"
+OneHotArrays = "0b1bfda6-eb8a-41d2-88d8-f5af5cad476f"
+StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91"
+
 [compat]
+Adapt = "4.1.1"
+ForwardBackward = "1.0.0"
+Manifolds = "0.10.12"
+NNlib = "0.9.27"
+OneHotArrays = "0.2.6"
+StatsBase = "0.34.4"
 julia = "1.9"
 
 [extras]
 
@@ -0,0 +1,9 @@
+[deps]
+Flowfusion = "5b4e93c8-7b6e-4682-b400-fc3b238f52b1"
+Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
+ForwardBackward = "e879419d-bb0f-4252-adee-d266c51ac92d"
+Manifolds = "1cead3c2-87b3-11e9-0ccd-23c62b72b94e"
+NNlib = "872c559c-99b0-510c-b3b7-b6c96a88d5cd"
+Optimisers = "3bd65402-5787-11e9-1adc-39752487f4e2"
+Plots = "91a5bcdd-55d7-5caf-9e0b-520d859cae80"
+RandomFeatureMaps = "780baa95-dd42-481b-93db-80fe3d88832c"
@@ -0,0 +1,90 @@
+using Pkg
+Pkg.activate(".")
+using Revise
+Pkg.develop(path="../../ForwardBackward/")
+Pkg.develop(path="../")
+using ForwardBackward, Flowfusion, NNlib, Flux, RandomFeatureMaps, Optimisers, Plots
+
+#Set up a Flux model: X̂1 = model(t,Xt)
+"""
+    FModel(; embeddim = 128, spacedim = 2, layers = 3)
+
+Small residual network used by this example to predict `X̂1` from `(t, Xt)`.
+
+# Keywords
+- `embeddim`: width of the time/state embeddings and of every hidden layer.
+- `spacedim`: dimension of the state; sets the input width of the state embedding
+  and the output width of the decoder.
+- `layers`: number of residual `Dense` blocks.
+"""
+struct FModel{A}
+    layers::A
+end
+Flux.@layer FModel
+function FModel(; embeddim = 128, spacedim = 2, layers = 3)
+    embed_time = Chain(RandomFourierFeatures(1 => embeddim, 1f0), Dense(embeddim => embeddim, swish))
+    #The state embedding must accept `spacedim` inputs (this was hard-coded to 2):
+    embed_state = Chain(RandomFourierFeatures(spacedim => embeddim, 1f0), Dense(embeddim => embeddim, swish))
+    ffs = [Dense(embeddim => embeddim, swish) for _ in 1:layers]
+    decode = Dense(embeddim => spacedim)
+    #Separate name, so the integer `layers` keyword is not rebound to a NamedTuple:
+    components = (; embed_time, embed_state, ffs, decode)
+    return FModel(components)
+end
+
+#Forward pass: sums the time and state embeddings, applies the residual blocks,
+#and adds the decoded correction (scaled by `1.05 - t`) onto the input tensor.
+function (f::FModel)(t, Xt)
+    net = f.layers
+    xt = tensor(Xt)
+    #NOTE(review): `expand` presumably reshapes `t` to broadcast against `xt` - confirm.
+    tcol = expand(t, ndims(xt))
+    tv = zero(xt[1:1,:]) .+ tcol
+    h = net.embed_time(tv) .+ net.embed_state(xt)
+    for block in net.ffs
+        h = h .+ block(h)
+    end
+    return xt .+ net.decode(h) .* (1.05f0 .- tcol)
+end
+
+model = FModel(embeddim = 256, layers = 3, spacedim = 2)
+
+#Distributions for training (all samples use element type `T`):
+T = Float32
+#Target X1: noisy points drawn by Flowfusion.random_literal_cat, with noise scale 0.05
+sampleX1(n_samples) = Flowfusion.random_literal_cat(n_samples, sigma = T(0.05))
+#Source X0: 2 x n_samples array, uniform on [2,3) in each coordinate
+sampleX0(n_samples) = rand(T, 2, n_samples) .+ 2
+#Batch size used for every training iteration
+n_samples = 200
+
+#The process (swap with the commented-out line to use the alternative process):
+P = BrownianMotion(0.1f0)
+#P = Deterministic()
+
+#Optimizer: `eta` is the initial learning rate passed to AdamW
+eta = 0.01
+opt_state = Flux.setup(AdamW(eta = eta, lambda = 0.001), model)
+
+iters = 5000
+for i in 1:iters
+    #`eta` is updated below. Without this declaration, running the file as a script makes
+    #`eta` a new loop-local variable, and reading it (in `println` or `*=`) throws an UndefVarError.
+    global eta
+    #Set up a batch of training pairs, and t:
+    X1 = ContinuousState(sampleX1(n_samples))
+    X0 = ContinuousState(sampleX0(n_samples))
+    t = rand(T, n_samples)
+    #Construct the bridge:
+    Xt = bridge(P, X0, X1, t)
+    #Gradient:
+    l,g = Flux.withgradient(model) do m
+        floss(P, m(t,Xt), X1, scalefloss(P, t, 2))
+    end
+    #Update:
+    Flux.update!(opt_state, model, g[1])
+    #Logging every 10 iterations, and lr cooldown over the last 2000 iterations:
+    if i % 10 == 0
+        if i > iters - 2000
+            eta *= 0.975
+            Optimisers.adjust!(opt_state, eta)
+        end
+        println("i: $i; Loss: $l; eta: $eta")
+    end
+end
+
+#Sample fresh starting points and integrate them to t = 1, recording every step
+n_inference_samples = 5000
+X0 = ContinuousState(sampleX0(n_inference_samples))
+paths = Tracker()
+samp = gen(P, X0, model, 0f0:0.005f0:1f0, tracker = paths)
+
+#Stack the recorded times and states into arrays for plotting
+tvec = stack_tracker(paths, :t)
+xttraj = stack_tracker(paths, :xt)
+
+#Plot: starting points, a subset of trajectories, then true and generated endpoints
+pl = scatter(
+    X0.state[1,:], X0.state[2,:],
+    msw = 0, ms = 1, color = "blue", alpha = 0.5,
+    size = (400,400), legend = :topleft, label = "X0",
+)
+for i in 1:50:1000
+    #Only the first trajectory gets a legend entry
+    traj_label = i==1 ? "Trajectory" : :none
+    plot!(xttraj[1,i,:], xttraj[2,i,:], color = "red", label = traj_label, alpha = 0.4)
+end
+X1true = sampleX1(n_inference_samples)
+scatter!(
+    X1true[1,:], X1true[2,:],
+    msw = 0, ms = 1, color = "orange", alpha = 0.5, label = "X1 (true)",
+)
+scatter!(
+    samp.state[1,:], samp.state[2,:],
+    msw = 0, ms = 1, color = "green", alpha = 0.5, label = "X1 (generated)",
+)
+display(pl)
+savefig("continuous_cat_$P.svg")
@@ -1,5 +1,31 @@
 module Flowfusion
 
-# Write your package code here.
+using ForwardBackward, OneHotArrays, Adapt, Manifolds, NNlib
+
+include("bridge.jl")
+include("loss.jl")
+
+export 
+    MaskedState,
+    bridge,    
+    scalefloss,
+    gen,
+    Tracker,
+    stack_tracker,
+    onehot,
+    FProcess,
+    tangent_coordinates,
+    apply_tangent_coordinates,
+    floss,
+    tcloss
+
+
+#Useful for demos etc:
+#Define a cat - from https://www.geogebra.org/m/pH8wD3rW
+"""
+    cat_shape(t)
+
+Evaluates a parametric curve at parameter `t` and returns a 2-element vector of coordinates.
+Each coordinate is a fixed sum of `sin(k*t)` and `cos(k*t)` terms for integer `k` up to 30,
+so the curve repeats with period `2pi` in `t`.
+"""
+cat_shape(t) = [-(721*sin(t))/4+196/3*sin(2*t)-86/3*sin(3*t)-131/2*sin(4*t)+477/14*sin(5*t)+27*sin(6*t)-29/2*sin(7*t)+68/5*sin(8*t)+1/10*sin(9*t)+23/4*sin(10*t)-19/2*sin(12*t)-85/21*sin(13*t)+2/3*sin(14*t)+27/5*sin(15*t)+7/4*sin(16*t)+17/9*sin(17*t)-4*sin(18*t)-1/2*sin(19*t)+1/6*sin(20*t)+6/7*sin(21*t)-1/8*sin(22*t)+1/3*sin(23*t)+3/2*sin(24*t)+13/5*sin(25*t)+sin(26*t)-2*sin(27*t)+3/5*sin(28*t)-1/5*sin(29*t)+1/5*sin(30*t)+(2337*cos(t))/8-43/5*cos(2*t)+322/5*cos(3*t)-117/5*cos(4*t)-26/5*cos(5*t)-23/3*cos(6*t)+143/4*cos(7*t)-11/4*cos(8*t)-31/3*cos(9*t)-13/4*cos(10*t)-9/2*cos(11*t)+41/20*cos(12*t)+8*cos(13*t)+2/3*cos(14*t)+6*cos(15*t)+17/4*cos(16*t)-3/2*cos(17*t)-29/10*cos(18*t)+11/6*cos(19*t)+12/5*cos(20*t)+3/2*cos(21*t)+11/12*cos(22*t)-4/5*cos(23*t)+cos(24*t)+17/8*cos(25*t)-7/2*cos(26*t)-5/6*cos(27*t)-11/10*cos(28*t)+1/2*cos(29*t)-1/5*cos(30*t),
+    -(637*sin(t))/2-188/5*sin(2*t)-11/7*sin(3*t)-12/5*sin(4*t)+11/3*sin(5*t)-37/4*sin(6*t)+8/3*sin(7*t)+65/6*sin(8*t)-32/5*sin(9*t)-41/4*sin(10*t)-38/3*sin(11*t)-47/8*sin(12*t)+5/4*sin(13*t)-41/7*sin(14*t)-7/3*sin(15*t)-13/7*sin(16*t)+17/4*sin(17*t)-9/4*sin(18*t)+8/9*sin(19*t)+3/5*sin(20*t)-2/5*sin(21*t)+4/3*sin(22*t)+1/3*sin(23*t)+3/5*sin(24*t)-3/5*sin(25*t)+6/5*sin(26*t)-1/5*sin(27*t)+10/9*sin(28*t)+1/3*sin(29*t)-3/4*sin(30*t)-(125*cos(t))/2-521/9*cos(2*t)-359/3*cos(3*t)+47/3*cos(4*t)-33/2*cos(5*t)-5/4*cos(6*t)+31/8*cos(7*t)+9/10*cos(8*t)-119/4*cos(9*t)-17/2*cos(10*t)+22/3*cos(11*t)+15/4*cos(12*t)-5/2*cos(13*t)+19/6*cos(14*t)+7/4*cos(15*t)+31/4*cos(16*t)-cos(17*t)+11/10*cos(18*t)-2/3*cos(19*t)+13/3*cos(20*t)-5/4*cos(21*t)+2/3*cos(22*t)+1/4*cos(23*t)+5/6*cos(24*t)+3/4*cos(26*t)-1/2*cos(27*t)-1/10*cos(28*t)-1/3*cos(29*t)-1/19*cos(30*t)]
+
+"""
+    random_literal_cat(dims...; sigma = 0.05f0)
+
+Draws points on `cat_shape` at uniformly random parameters in `[0, 2pi)`, scales them by `1/200`,
+and adds Gaussian noise with standard deviation `sigma`.
+Returns an array of size `(2, dims...)` whose element type is `typeof(sigma)`.
+"""
+function random_literal_cat(dims...; sigma = 0.05f0)
+    outline = stack([cat_shape(rand()*2pi)/200 for _ in zeros(dims...)])
+    jitter = randn(2, dims...) * sigma
+    return typeof(sigma).(outline .+ jitter)
+end
+
 
 end
@@ -0,0 +1,156 @@
+#=#####################
+Assumptions:
+- t ∈ [0,1]. Any behavior can be controlled by manipulating the process parameters.
+- FProcess.F is a monotonic function, with F(0) = 0 and F(1) = 1.
+- Default sampling steps are FProcess.F(t) with even t intervals [NOTE TO SELF: Intervals should be F(t2)-F(t1)]
+=#####################
+
+"""
+    FProcess(P, F)
+
+Wraps a process `P` together with a time transform `F`.
+`tscale` applies `F` elementwise to `t`, and `process` returns the wrapped `P`.
+Per the assumptions at the top of this file, `F` should be monotonic with `F(0) = 0` and `F(1) = 1`.
+"""
+struct FProcess{A,B}
+    P::A #Process
+    F::B #Time transform
+end
+
+#Any process accepted by `bridge`/`gen`: a bare `Process`, or one wrapped in an `FProcess`.
+#`const` makes the alias a true type constant instead of a reassignable, untyped global.
+const UProcess = Union{Process,FProcess}
+#The underlying process, unwrapping an `FProcess` when needed:
+process(P::FProcess) = P.P
+process(P::Process) = P
+
+#Transformed time: the identity for a bare `Process`, `F` broadcast over `t` for an `FProcess`.
+tscale(P::Process, t) = t
+tscale(P::FProcess, t) = P.F.(t)
+
+"""
+    MaskedState(S, cmask, lmask)
+
+Wraps a state `S` with two masks: `cmask` marks where `Xt` is forced to equal `X1` (see `cmask!`),
+and `lmask` marks what is included in the loss.
+"""
+struct MaskedState{A,B,C}
+    S::A     #State
+    cmask::B #Conditioning mask. 1 = Xt=X1
+    lmask::C #Loss mask.         1 = included in loss
+end
+
+#Adapt.jl rules: rebuild each state/likelihood type around its adapted array fields,
+#passing non-array fields (`K`, `M`) through unchanged.
+function Adapt.adapt_structure(to, S::ForwardBackward.DiscreteState)
+    return ForwardBackward.DiscreteState(S.K, Adapt.adapt(to, S.state))
+end
+
+function Adapt.adapt_structure(to, S::ForwardBackward.ContinuousState)
+    return ForwardBackward.ContinuousState(Adapt.adapt(to, S.state))
+end
+
+function Adapt.adapt_structure(to, S::ForwardBackward.CategoricalLikelihood)
+    dist = Adapt.adapt(to, S.dist)
+    log_norm_const = Adapt.adapt(to, S.log_norm_const)
+    return ForwardBackward.CategoricalLikelihood(dist, log_norm_const)
+end
+
+#A MaskedState adapts its wrapped state and both masks.
+function Adapt.adapt_structure(to, MS::MaskedState{<:State})
+    inner = Adapt.adapt(to, MS.S)
+    cond = Adapt.adapt(to, MS.cmask)
+    loss = Adapt.adapt(to, MS.lmask)
+    return MaskedState(inner, cond, loss)
+end
+
+function Adapt.adapt_structure(to, MS::MaskedState{<:CategoricalLikelihood})
+    inner = Adapt.adapt(to, MS.S)
+    cond = Adapt.adapt(to, MS.cmask)
+    loss = Adapt.adapt(to, MS.lmask)
+    return MaskedState(inner, cond, loss)
+end
+
+function Adapt.adapt_structure(to, S::ForwardBackward.ManifoldState)
+    return ForwardBackward.ManifoldState(S.M, Adapt.adapt(to, S.state))
+end
+
+#Any state accepted by `bridge`/`gen`: a plain `State`, or a `MaskedState`.
+#`const` makes the alias a true type constant instead of a reassignable, untyped global.
+const UState = Union{State,MaskedState}
+
+#The tensor of a `MaskedState` is the tensor of the state it wraps.
+ForwardBackward.tensor(X::MaskedState) = tensor(X.S)
+
+import Base.copy
+#Masks may be `nothing` (`cmask!` has a `cmask::Nothing` method), which `Base.copy` does not accept,
+#so `nothing` is passed through unchanged.
+copymask(mask) = copy(mask)
+copymask(::Nothing) = nothing
+#Copies the wrapped state and both masks into a new `MaskedState`.
+copy(X::MaskedState) = MaskedState(copy(X.S), copymask(X.cmask), copymask(X.lmask))
+
+"""
+    endslices(a,m)
+
+Returns a view of `a` where slices specified by `m` are selected. `m` can be multidimensional, but the dimensions of `m` must match the last dimensions of `a`.
+For example, if `m` is a boolean array, then `size(a)[ndims(a)-ndims(m)+1:end] == size(m)`.
+The leading `ndims(a)-ndims(m)` dimensions of `a` are indexed with `:` and so are kept whole.
+"""
+endslices(a,m) = @view a[ntuple(Returns(:),ndims(a)-ndims(m))...,m]
+
+"""
+    cmask!(Xt_state, X1_state, cmask)
+    cmask!(Xt, X1)
+
+Applies, in place, a conditioning mask, forcing elements (or slices) of `Xt` to be equal to `X1`, where `cmask` is 1.
+
+The three-argument form works on raw state arrays and returns `Xt_state`; it is a no-op when `cmask` is `nothing`.
+The two-argument form takes the mask from `X1.cmask` when `X1` is a `MaskedState`, is a no-op when `X1` is a
+plain `State` or `StateLikelihood`, and maps over matching elements when both arguments are tuples.
+It returns `Xt` (or a tuple of them), so the result can be passed on directly.
+Conditioning on a `MaskedState` that wraps a `CategoricalLikelihood` throws an error.
+"""
+function cmask!(Xt_state, X1_state, cmask)
+    endslices(Xt_state,cmask) .= endslices(X1_state,cmask)
+    return Xt_state
+end
+
+cmask!(Xt_state, X1_state, cmask::Nothing) = Xt_state
+cmask!(Xt, X1::State) = Xt
+cmask!(Xt, X1::StateLikelihood) = Xt
+function cmask!(Xt, X1::MaskedState)
+    cmask!(Xt.S.state, X1.S.state, X1.cmask)
+    #Return the state object itself (not its raw array), matching the other two-argument methods.
+    return Xt
+end
+cmask!(Xt, X1::MaskedState{<:CategoricalLikelihood}) = error("Cannot condition on a CategoricalLikelihood")
+cmask!(x̂₁::Tuple, x₀::Tuple) = map(cmask!, x̂₁, x₀)
+
+#NOTE: no blank line may separate the docstring from `function bridge`, or Julia will not attach it.
+"""
+    bridge(P, X0, X1, t)
+    bridge(P, X0, X1, t0, t)
+
+Samples `Xt` at `t` conditioned on `X0` and `X1` under the process `P`. Start time is `t0` (0 if not specified). End time is 1.
+If `X1` is a `MaskedState`, then `Xt` will equal `X1` where the conditioning mask `X1.cmask` is 1.
+The mask is applied to `X0` in place (via `cmask!`) before sampling, so `X0` is modified in that case.
+`P`, `X0`, `X1` can also be tuples where the Nth element of `P` will be used for the Nth elements of `X0` and `X1`.
+The same `t` and (optionally) `t0` will be used for all elements. If you need a different `t` for each Process/State, broadcast with `bridge.(P, X0, X1, t0, t)`.
+"""
+function bridge(P::UProcess, X0::UState, X1, t0, t)
+    T = eltype(t)
+    #Forward duration (t0 -> t) and backward duration (t -> 1), in transformed time:
+    tF = T.(tscale(P,t) .- tscale(P,t0))
+    tB = T.(tscale(P,1) .- tscale(P,t))
+    return endpoint_conditioned_sample(cmask!(X0,X1), X1, process(P), tF, tB)
+end
+bridge(P, X0, X1, t) = bridge(P, X0, X1, eltype(t)(0.0), t)
+bridge(P::Tuple{Vararg{UProcess}}, X0::Tuple{Vararg{UState}}, X1::Tuple, t0, t) = bridge.(P, X0, X1, (t0,), (t, ))
+
+
+
+#copytensor! and resolveprediction are used to handle the state translation that happens in gen(...).
+#We want the user's X̂₁predictor, which is a DL model, to return a plain tensor (since that will be on the GPU, in the loss, etc).
+#This means we need to automagically create a State (typical for the continuous case) or Likelihood (typical for the discrete case) from the tensor.
+#But the user may return a State in the Discrete case (for massive state spaces with sub-linear sampling), and a Likelihood in the Continuous case (for variance matching models)
+#This also needs to handle MaskedStates (needs testing).
+#We need: X̂₁ =  fix(X̂₁predictor(t, Xₜ))
+#Plan: When X̂₁predictor(t, Xₜ) is a State or Likelihood, just pass through.
+#When X̂₁predictor(t, Xₜ) is a plain tensor, we apply default conversion rules.
+
+#Overwrites the tensor of `dest` with the tensor of `src` (broadcast assignment) and returns `dest`.
+function copytensor!(dest, src)
+    target = tensor(dest)
+    target .= tensor(src)
+    return dest
+end
+#copytensor!(dest::Tuple, src::Tuple) = map(copytensor!, dest, src)
+
+#Tuple broadcast:
+resolveprediction(dest::Tuple, src::Tuple) = map(resolveprediction, dest, src)
+#Default if X̂₁ is a plain tensor:
+resolveprediction(X̂₁, X₀::DiscreteState) = copytensor!(stochastic(X₀), X̂₁) #Returns a Likelihood
+resolveprediction(X̂₁, X₀::State) = copytensor!(copy(X₀), X̂₁) #Returns a State - Handles Continuous and Manifold cases
+#Passthrough if the user returns a State or Likelihood
+resolveprediction(X̂₁::State, X₀) = X̂₁
+resolveprediction(X̂₁::State, X₀::State) = X̂₁
+resolveprediction(X̂₁::StateLikelihood, X₀) = X̂₁
+#Disambiguation: without these, a State/Likelihood prediction paired with a State or DiscreteState X₀
+#matches both a passthrough method and a plain-tensor default, and the call fails as ambiguous.
+resolveprediction(X̂₁::State, X₀::DiscreteState) = X̂₁
+resolveprediction(X̂₁::StateLikelihood, X₀::State) = X̂₁
+resolveprediction(X̂₁::StateLikelihood, X₀::DiscreteState) = X̂₁
+#####Add MaskedState case(s)######
+
+##################################
+
+
+
+"""
+    gen(P, X0, X̂₁predictor, steps; tracker=Returns(nothing), midpoint = false)
+
+Constructs a sequence of (stochastic) bridges between `X0` and the predicted `X̂₁` under the process `P`.
+`P`, `X0`, can also be tuples where the Nth element of `P` will be used for the Nth elements of `X0` and `X̂₁predictor`.
+X̂₁predictor is a function that takes `t` (scalar) and `Xₜ` (optionally a tuple) and returns `X̂₁` (a `UState`, a flat tensor with the right shape, or a tuple of either).
+If `X0` is a `MaskedState` (or a tuple containing one), then `X̂₁` will be conditioned on `X0` wherever the conditioning mask `X0.cmask` is 1.
+
+`steps` is the vector of time points; one bridge is sampled per consecutive pair `(s₁, s₂)`.
+The predictor is evaluated at `s₁`, or at `(s₁ + s₂) / 2` when `midpoint = true`.
+After each step, `tracker(t, Xₜ, X̂₁)` is called with the predictor time, the updated state and the prediction.
+Returns the state reached after the final step.
+"""
+function gen(P::Tuple{Vararg{UProcess}}, X₀::Tuple{Vararg{UState}}, X̂₁predictor, steps::AbstractVector; tracker::Function=Returns(nothing), midpoint = false)
+    Xₜ = copy.(X₀)
+    for (s₁, s₂) in zip(steps, steps[begin+1:end])
+        #Time at which the predictor is queried for this step:
+        t = midpoint ? (s₁ + s₂) / 2 : s₁
+        X̂₁ = resolveprediction(X̂₁predictor(t, Xₜ), X₀)
+        #Force the prediction to agree with X₀ wherever X₀ carries a conditioning mask:
+        cmask!(X̂₁, X₀)
+        Xₜ = bridge(P, Xₜ, X̂₁, s₁, s₂)
+        tracker(t, Xₜ, X̂₁)
+    end
+    return Xₜ
+end
+
+#Single-process convenience method: wraps `P`, `X₀` and the predictor's output in 1-tuples,
+#calls `gen` again with them, and unwraps the first element of the result.
+function gen(P, X₀, X̂₁predictor, args...; kwargs...)
+    wrapped(t, Xₜ) = (X̂₁predictor(t[1], Xₜ[1]),)
+    return gen((P,), (X₀,), wrapped, args...; kwargs...)[1]
+end
+
+"""
+    Tracker()
+
+Callable recorder that can be passed as the `tracker` keyword of `gen`.
+Each call `tracker(t, xt, x̂1)` appends its arguments to the `t`, `xt` and `x̂1` vectors and returns `nothing`.
+"""
+struct Tracker <: Function
+    t::Vector
+    xt::Vector
+    x̂1::Vector
+end
+
+#Starts with three empty, untyped vectors.
+Tracker() = Tracker(Any[], Any[], Any[])
+
+function (tracker::Tracker)(t, xt, x̂1)
+    for (store, value) in ((tracker.t, t), (tracker.xt, xt), (tracker.x̂1, x̂1))
+        push!(store, value)
+    end
+    return nothing
+end
+
+#Stacks the recorded values of one tracker field into a single array.
+#For each recorded entry, element `tuple_index` is taken and converted with `tensor`.
+function stack_tracker(tracker, field; tuple_index = 1)
+    entries = getproperty(tracker, field)
+    tensors = [tensor(entry[tuple_index]) for entry in entries]
+    return stack(tensors)
+end