
Commit 4b6d95d

Method to extract loglikelihoods (#166)
For several reasons, it would be very nice to have a way of extracting the log-likelihoods from a chain. This PR implements the method `loglikelihoods` to do exactly this.

# Up for discussion

1. **Return value.** Right now it returns a `Dict{String, Vector{Float64}}`, with the keys being `string(varname)` and the values being arrays whose i-th element is the log-likelihood of `string(varname)` in `chain[i]`. Alternatives:
   - a "hierarchical" dict of the form `Dict(y => Dict(y[1] => ..., y[2] => ...), ...)`
   - a "flattened" dict of the form `Dict(y[1] => ..., y[2] => ..., ...)`
   - ????
2. **Project structure.** I'm a bit uncertain where to actually put the implementation. As I have now experienced, exactly what you need to implement to make an `AbstractSampler` is a bit unclear, e.g. there are methods in `varinfo.jl` (such as `getindex`) which also require implementations. So, should I keep it in its own file, as I have now, or should I follow suit with `SampleFromPrior` and `SampleFromUniform`?

# Example

```julia
julia> using DynamicPPL, Turing

julia> @model function demo(xs, y)
           s ~ InverseGamma(2, 3)
           m ~ Normal(0, √s)
           for i in eachindex(xs)
               xs[i] ~ Normal(m, √s)
           end
           y ~ Normal(m, √s)
       end
demo (generic function with 1 method)

julia> model = demo(randn(3), randn());

julia> chain = sample(model, MH(), 10);

julia> DynamicPPL.loglikelihoods(model, chain)
Dict{String,Array{Float64,1}} with 4 entries:
  "xs[3]" => [-1.02616, -1.26931, -1.05003, -5.05458, -1.33825, -1.02904, -1.23761, -1.30128, -1.04872, -2.03716]
  "xs[1]" => [-2.08205, -2.51387, -3.03175, -2.5981, -2.31322, -2.62284, -2.70874, -1.18617, -1.36281, -4.39839]
  "xs[2]" => [-2.20604, -2.63495, -3.22802, -2.48785, -2.40941, -2.78791, -2.85013, -1.24081, -1.46019, -4.59025]
  "y"     => [-1.36627, -1.21964, -1.03342, -7.46617, -1.3234, -1.14536, -1.14781, -2.48912, -2.23705, -1.26267]
```
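Not part of the commit, but relevant to the return-value question above: a minimal sketch of how a consumer could flatten the string-keyed `Dict{String, Vector{Float64}}` shown in the example into a samples × observations matrix. The helper name `loglik_matrix` is purely illustrative.

```julia
# Hypothetical helper, not part of this PR: reshape the per-variable log-likelihood
# vectors into a samples × observations matrix with a fixed column order.
function loglik_matrix(loglikelihoods::Dict{String, Vector{Float64}})
    names = sort(collect(keys(loglikelihoods)))  # fix a column order
    return names, reduce(hcat, (loglikelihoods[n] for n in names))
end

# Usage: names, L = loglik_matrix(DynamicPPL.loglikelihoods(model, chain))
# L[i, j] is then the log-likelihood of observation names[j] in sample i.
```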
1 parent 405546f commit 4b6d95d

File tree

5 files changed: +175 −1 lines changed


Project.toml

Lines changed: 1 addition & 1 deletion
```diff
@@ -1,6 +1,6 @@
 name = "DynamicPPL"
 uuid = "366bfd00-2699-11ea-058f-f148b4cae6d8"
-version = "0.9.1"
+version = "0.9.2"

 [deps]
 AbstractMCMC = "80f14c24-f653-4e6a-9b94-39d6b0f70001"
```

src/DynamicPPL.jl

Lines changed: 2 additions & 0 deletions
```diff
@@ -90,6 +90,7 @@ export AbstractVarInfo,
     # Convenience functions
     logprior,
     logjoint,
+    elementwise_loglikelihoods,
     # Convenience macros
     @addlogprob!

@@ -118,5 +119,6 @@ include("context_implementations.jl")
 include("compiler.jl")
 include("prob_macro.jl")
 include("compat/ad.jl")
+include("loglikelihoods.jl")

 end # module
```

src/loglikelihoods.jl

Lines changed: 131 additions & 0 deletions
````julia
# Context version
struct ElementwiseLikelihoodContext{A, Ctx} <: AbstractContext
    loglikelihoods::A
    ctx::Ctx
end

function ElementwiseLikelihoodContext(
    likelihoods = Dict{VarName, Vector{Float64}}(),
    ctx::AbstractContext = LikelihoodContext()
)
    return ElementwiseLikelihoodContext{typeof(likelihoods), typeof(ctx)}(likelihoods, ctx)
end

function Base.push!(
    ctx::ElementwiseLikelihoodContext{Dict{VarName, Vector{Float64}}},
    vn::VarName,
    logp::Real
)
    lookup = ctx.loglikelihoods
    ℓ = get!(lookup, vn, Float64[])
    push!(ℓ, logp)
end

function Base.push!(
    ctx::ElementwiseLikelihoodContext{Dict{VarName, Float64}},
    vn::VarName,
    logp::Real
)
    ctx.loglikelihoods[vn] = logp
end


function tilde_assume(rng, ctx::ElementwiseLikelihoodContext, sampler, right, vn, inds, vi)
    return tilde_assume(rng, ctx.ctx, sampler, right, vn, inds, vi)
end

function dot_tilde_assume(rng, ctx::ElementwiseLikelihoodContext, sampler, right, left, vn, inds, vi)
    value, logp = dot_tilde(rng, ctx.ctx, sampler, right, left, vn, inds, vi)
    acclogp!(vi, logp)
    return value
end


function tilde_observe(ctx::ElementwiseLikelihoodContext, sampler, right, left, vname, vinds, vi)
    # This is slightly unfortunate since it is not completely generic...
    # Ideally we would call `tilde_observe` recursively, but then we wouldn't get the
    # log-likelihood value.
    logp = tilde(ctx.ctx, sampler, right, left, vi)
    acclogp!(vi, logp)

    # Track the log-likelihood value.
    push!(ctx, vname, logp)

    return left
end


"""
    elementwise_loglikelihoods(model::Model, chain::Chains)

Run `model` on each sample in `chain` and return a `Dict` mapping each observed
variable to a vector whose i-th element is the log-likelihood of that observation
for the i-th sample in `chain`.

# Notes
Say `y` is a `Vector` of `n` i.i.d. `Normal(μ, σ)` variables, with `μ` and `σ`
both being `<:Real`. Then the *observe* statements (i.e. those where the left-hand
side is an *observation*) can be implemented in two ways:
```julia
for i in eachindex(y)
    y[i] ~ Normal(μ, σ)
end
```
or
```julia
y ~ MvNormal(fill(μ, n), fill(σ, n))
```
Unfortunately, just by looking at the latter statement, it's impossible to tell whether
it is one *single* `n`-dimensional observation or *multiple* 1-dimensional observations.
Therefore, `elementwise_loglikelihoods` only works with the first form.

# Examples
```julia-repl
julia> using DynamicPPL, Turing

julia> @model function demo(xs, y)
           s ~ InverseGamma(2, 3)
           m ~ Normal(0, √s)
           for i in eachindex(xs)
               xs[i] ~ Normal(m, √s)
           end

           y ~ Normal(m, √s)
       end
demo (generic function with 1 method)

julia> model = demo(randn(3), randn());

julia> chain = sample(model, MH(), 10);

julia> DynamicPPL.elementwise_loglikelihoods(model, chain)
Dict{String,Array{Float64,1}} with 4 entries:
  "xs[3]" => [-1.02616, -1.26931, -1.05003, -5.05458, -1.33825, -1.02904, -1.23761, -1.30128, -1.04872, -2.03716]
  "xs[1]" => [-2.08205, -2.51387, -3.03175, -2.5981, -2.31322, -2.62284, -2.70874, -1.18617, -1.36281, -4.39839]
  "xs[2]" => [-2.20604, -2.63495, -3.22802, -2.48785, -2.40941, -2.78791, -2.85013, -1.24081, -1.46019, -4.59025]
  "y"     => [-1.36627, -1.21964, -1.03342, -7.46617, -1.3234, -1.14536, -1.14781, -2.48912, -2.23705, -1.26267]
```
"""
function elementwise_loglikelihoods(model::Model, chain)
    # Set up the per-variable accumulator and a varinfo by executing the model once.
    ctx = ElementwiseLikelihoodContext()
    spl = SampleFromPrior()
    vi = VarInfo(model)

    iters = Iterators.product(1:size(chain, 1), 1:size(chain, 3))
    for (sample_idx, chain_idx) in iters
        # Update the values in the varinfo from the chain sample.
        setval!(vi, chain, sample_idx, chain_idx)

        # Execute the model, accumulating per-observation log-likelihoods in `ctx`.
        model(vi, spl, ctx)
    end
    return ctx.loglikelihoods
end

function elementwise_loglikelihoods(model::Model, varinfo::AbstractVarInfo)
    ctx = ElementwiseLikelihoodContext(Dict{VarName, Float64}())
    model(varinfo, SampleFromPrior(), ctx)
    return ctx.loglikelihoods
end
````
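As a consumer-side sanity check (not part of the commit): since each observe statement's log-likelihood is recorded per sample, summing the returned vectors across variables gives the total observation log-likelihood for each sample. A minimal sketch, assuming the chain-based method's `Dict{VarName, Vector{Float64}}` return shape:

```julia
# Sketch only (not part of this commit): elementwise sum of the per-variable vectors
# yields one total observation log-likelihood per sample in the chain.
total_loglikelihood_per_sample(loglikelihoods::AbstractDict) =
    reduce(+, values(loglikelihoods))
```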

test/loglikelihoods.jl

Lines changed: 40 additions & 0 deletions
```julia
using .Turing

@testset "loglikelihoods" begin
    @model function demo(xs, y)
        s ~ InverseGamma(2, 3)
        m ~ Normal(0, s)
        for i in eachindex(xs)
            xs[i] ~ Normal(m, s)
        end

        y ~ Normal(m, s)
    end

    xs = randn(3);
    y = randn();
    model = demo(xs, y);
    chain = sample(model, MH(), 100);
    results = elementwise_loglikelihoods(model, chain)
    var_to_likelihoods = Dict(string(varname) => logliks for (varname, logliks) in results)
    @test haskey(var_to_likelihoods, "xs[1]")
    @test haskey(var_to_likelihoods, "xs[2]")
    @test haskey(var_to_likelihoods, "xs[3]")
    @test haskey(var_to_likelihoods, "y")

    for (i, (s, m)) in enumerate(zip(chain[:s], chain[:m]))
        @test logpdf(Normal(m, s), xs[1]) == var_to_likelihoods["xs[1]"][i]
        @test logpdf(Normal(m, s), xs[2]) == var_to_likelihoods["xs[2]"][i]
        @test logpdf(Normal(m, s), xs[3]) == var_to_likelihoods["xs[3]"][i]
        @test logpdf(Normal(m, s), y) == var_to_likelihoods["y"][i]
    end

    var_info = VarInfo(model)
    results = DynamicPPL.elementwise_loglikelihoods(model, var_info)
    var_to_likelihoods = Dict(string(vn) => ℓ for (vn, ℓ) in results)
    s, m = var_info[SampleFromPrior()]
    @test logpdf(Normal(m, s), xs[1]) == var_to_likelihoods["xs[1]"]
    @test logpdf(Normal(m, s), xs[2]) == var_to_likelihoods["xs[2]"]
    @test logpdf(Normal(m, s), xs[3]) == var_to_likelihoods["xs[3]"]
    @test logpdf(Normal(m, s), y) == var_to_likelihoods["y"]
end
```

test/runtests.jl

Lines changed: 1 addition & 0 deletions
@@ -28,6 +28,7 @@ include("test_util.jl")
2828
include("independence.jl")
2929
include("distribution_wrappers.jl")
3030
include("context_implementations.jl")
31+
include("loglikelihoods.jl")
3132

3233
include("threadsafe.jl")
3334
