Skip to content

Commit e24ff54

Browse files
committed
docu: tutorial on inspecting fit
1 parent a7959b9 commit e24ff54

File tree

10 files changed

+372
-33
lines changed

10 files changed

+372
-33
lines changed

dev/doubleMM.jl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -572,7 +572,7 @@ f_allsites = get_hybridproblem_PBmodel(prob0; scenario, use_all_sites = true)
572572
trans_mP=StackedArray(transP, size(ζsP, 2))
573573
trans_mMs=StackedArray(transM, size(ζsMs, 1) * size(ζsMs, 3))
574574
θsP, θsMs = transform_ζs(ζsP, ζsMs; trans_mP, trans_mMs)
575-
y = apply_process_model(θsP, θsMs, f, xP)
575+
y = apply_process_model(θsP, θsMs, f, xP)
576576
#(; y, θsP, θsMs) = HVI.apply_f_trans(ζsP, ζsMs, f_allsites, xP; transP, transM);
577577
(y_hmc, θsP_hmc, θsMs_hmc) = (; y, θsP, θsMs);
578578

docs/make.jl

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -17,14 +17,15 @@ makedocs(;
1717
"Problem" => "problem.md",
1818
"Tutorials" => [
1919
"Basic workflow" => "tutorials/basic_cpu.md",
20-
"Test quarto markdown" => "tutorials/test1.md",
20+
"Inspect results" => "tutorials/inspect_results.md",
21+
#"Test quarto markdown" => "tutorials/test1.md",
2122
],
2223
"How to" => [
2324
#".. model independent parameters" => "tutorials/how_to_guides/blocks_corr_site.md",
2425
#".. model site-global corr" => "tutorials/how_to_guides/corr_site_global.md",
2526
],
2627
"Explanation" => [
27-
"Theory" => "explanation/theory_hvi.md",
28+
#"Theory" => "explanation/theory_hvi.md", TODO activate when paper is published
2829
],
2930
"Reference" => [
3031
"Public" => "reference/reference_public.md",

docs/src/tutorials/Project.toml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,14 @@
11
[deps]
22
Bijectors = "76274a88-744f-5084-9051-94815aaf08c4"
3+
CairoMakie = "13f3f980-e62b-5c42-98c6-ff1f3baf88f0"
34
CommonSolve = "38540f10-b2f7-11e9-35d8-d573e4eb0ff2"
45
ComponentArrays = "b0b7db55-cfe3-40fc-9ded-d10e2dbeff66"
56
DistributionFits = "45214091-1ed4-4409-9bcf-fdb48a05e921"
67
HybridVariationalInference = "a108c475-a4e2-4021-9a84-cfa7df242f64"
78
JLD2 = "033835bb-8acc-5ee8-8aae-3f567f8a3819"
89
MLUtils = "f1d291b0-491e-4a28-83b9-f70985020b54"
910
OptimizationOptimisers = "42dfb2eb-d2b4-4451-abcd-913932933ac1"
11+
PairPlots = "43a3c2be-4208-490b-832a-a21dcd55d7da"
1012
Plots = "91a5bcdd-55d7-5caf-9e0b-520d859cae80"
1113
SimpleChains = "de6bee2f-e2f4-4ec7-b6ed-219cc6f6e9e5"
1214
StableRNGs = "860ef19b-820b-49d6-a774-d7a799459cd3"

docs/src/tutorials/_pbm_matrix.qmd

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
```{julia}
2+
function f_doubleMM_sites(θc::CA.ComponentMatrix, xPc::CA.ComponentMatrix)
3+
# extract several covariates from xP
4+
ST = typeof(CA.getdata(xPc)[1:1,:]) # workaround for non-type-stable Symbol-indexing
5+
S1 = (CA.getdata(xPc[:S1,:])::ST)
6+
S2 = (CA.getdata(xPc[:S2,:])::ST)
7+
#
8+
# extract the parameters as row-repeated vectors
9+
n_obs = size(S1, 1)
10+
VT = typeof(CA.getdata(θc)[:,1]) # workaround for non-type-stable Symbol-indexing
11+
(r0, r1, K1, K2) = map((:r0, :r1, :K1, :K2)) do par
12+
p1 = CA.getdata(θc[:, par]) ::VT
13+
repeat(p1', n_obs) # matrix: same for each concentration row in S1
14+
end
15+
#
16+
# each variable is a matrix (n_obs x n_site)
17+
r0 .+ r1 .* S1 ./ (K1 .+ S1) .* S2 ./ (K2 .+ S2)
18+
end
19+
```
20+

docs/src/tutorials/basic_cpu.md

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -247,10 +247,9 @@ import Zygote
247247

248248
solver = HybridPosteriorSolver(; alg=Adam(0.02), n_MC=3)
249249

250-
(; probo, interpreters) = solve(prob, solver; scenario, rng,
250+
(; probo, interpreters) = solve(prob, solver; rng,
251251
callback = callback_loss(100), # output during fitting
252252
epochs = 2,
253-
gdev = identity, # do not use GPU, here
254253
);
255254
```
256255

@@ -326,10 +325,9 @@ As a test of the new applicator, the results are refined by running a few more
326325
epochs of the optimization.
327326

328327
``` julia
329-
(; probo) = solve(probo_sites, solver; scenario, rng,
328+
(; probo) = solve(probo_sites, solver; rng,
330329
callback = callback_loss(100), # output during fitting
331330
epochs = 10,
332-
gdev = identity, # do not use GPU, here
333331
#is_inferred = Val(true), # activate type-checks
334332
);
335333
```

docs/src/tutorials/basic_cpu.qmd

Lines changed: 3 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -282,10 +282,9 @@ import Zygote
282282
283283
solver = HybridPosteriorSolver(; alg=Adam(0.02), n_MC=3)
284284
285-
(; probo, interpreters) = solve(prob, solver; scenario, rng,
285+
(; probo, interpreters) = solve(prob, solver; rng,
286286
callback = callback_loss(100), # output during fitting
287287
epochs = 2,
288-
gdev = identity, # do not use GPU, here
289288
);
290289
```
291290

@@ -317,25 +316,7 @@ For the parameters, one row corresponds to
317316
one site. For the drivers and predictions, one column corresponds to one site.
318317

319318

320-
```{julia}
321-
function f_doubleMM_sites(θc::CA.ComponentMatrix, xPc::CA.ComponentMatrix)
322-
# extract several covariates from xP
323-
ST = typeof(CA.getdata(xPc)[1:1,:]) # workaround for non-type-stable Symbol-indexing
324-
S1 = (CA.getdata(xPc[:S1,:])::ST)
325-
S2 = (CA.getdata(xPc[:S2,:])::ST)
326-
#
327-
# extract the parameters as row-repeated vectors
328-
n_obs = size(S1, 1)
329-
VT = typeof(CA.getdata(θc)[:,1]) # workaround for non-type-stable Symbol-indexing
330-
(r0, r1, K1, K2) = map((:r0, :r1, :K1, :K2)) do par
331-
p1 = CA.getdata(θc[:, par]) ::VT
332-
repeat(p1', n_obs) # matrix: same for each concentration row in S1
333-
end
334-
#
335-
# each variable is a matrix (n_obs x n_site)
336-
r0 .+ r1 .* S1 ./ (K1 .+ S1) .* S2 ./ (K2 .+ S2)
337-
end
338-
```
319+
{{< include _pbm_matrix.qmd >}}
339320

340321
Again, the function should not rely on the order of parameters but use symbolic indexing
341322
to extract the parameter vectors. For type stability of this symbolic indexing,
@@ -362,10 +343,9 @@ As a test of the new applicator, the results are refined by running a few more
362343
epochs of the optimization.
363344

364345
```{julia}
365-
(; probo) = solve(probo_sites, solver; scenario, rng,
346+
(; probo) = solve(probo_sites, solver; rng,
366347
callback = callback_loss(100), # output during fitting
367348
epochs = 10,
368-
gdev = identity, # do not use GPU, here
369349
#is_inferred = Val(true), # activate type-checks
370350
);
371351
```
Lines changed: 164 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,164 @@
1+
# Inspect results of fitted problem
2+
3+
4+
``` @meta
5+
CurrentModule = HybridVariationalInference
6+
```
7+
8+
First load necessary packages.
9+
10+
``` julia
11+
using HybridVariationalInference
12+
using StableRNGs
13+
using ComponentArrays: ComponentArrays as CA
14+
using SimpleChains # for reloading the optimized problem
15+
using DistributionFits
16+
using JLD2
17+
using CairoMakie
18+
using PairPlots # scatterplot matrices
19+
```
20+
21+
After redefining the process-based model (currently JLD2 cannot save functions),
22+
the previously optimized Problem can be loaded.
23+
24+
``` julia
25+
function f_doubleMM_sites(θc::CA.ComponentMatrix, xPc::CA.ComponentMatrix)
26+
# extract several covariates from xP
27+
ST = typeof(CA.getdata(xPc)[1:1,:]) # workaround for non-type-stable Symbol-indexing
28+
S1 = (CA.getdata(xPc[:S1,:])::ST)
29+
S2 = (CA.getdata(xPc[:S2,:])::ST)
30+
#
31+
# extract the parameters as row-repeated vectors
32+
n_obs = size(S1, 1)
33+
VT = typeof(CA.getdata(θc)[:,1]) # workaround for non-type-stable Symbol-indexing
34+
(r0, r1, K1, K2) = map((:r0, :r1, :K1, :K2)) do par
35+
p1 = CA.getdata(θc[:, par]) ::VT
36+
repeat(p1', n_obs) # matrix: same for each concentration row in S1
37+
end
38+
#
39+
# each variable is a matrix (n_obs x n_site)
40+
r0 .+ r1 .* S1 ./ (K1 .+ S1) .* S2 ./ (K2 .+ S2)
41+
end
42+
```
43+
44+
``` julia
45+
fname = "intermediate/basic_cpu_results.jld2"
46+
print(abspath(fname))
47+
probo, interpreters = load(fname, "probo", "interpreters");
48+
```
49+
50+
## Sample the posterior
51+
52+
A sample of both the posterior and the predictive posterior can be obtained
53+
using function [`sample_posterior`](@ref).
54+
55+
``` julia
56+
using StableRNGs
57+
rng = StableRNG(112)
58+
n_sample_pred = 400
59+
(; θsP, θsMs) = sample_posterior(rng, probo; n_sample_pred)
60+
```
61+
62+
Let's look at the results.
63+
64+
``` julia
65+
size(θsP), size(θsMs)
66+
```
67+
68+
((1, 400), (800, 2, 400))
69+
70+
The last dimension is the number of samples, the second-last dimension is
71+
the respective parameter. `θsMs` has an additional dimension denoting
72+
the site for which parameters are sampled.
73+
74+
They are ComponentArrays with the parameter dimension names that can be used:
75+
76+
``` julia
77+
θsMs[1,:r1,:] # sample of r1 of the first site
78+
```
79+
80+
### Corner plots
81+
82+
The relation between different variables can be well inspected by
83+
scatterplot matrices, also called corner plots or pair plots.
84+
`PairPlots.jl` provides a Makie-implementation of those.
85+
86+
Here, we plot the global parameters and the site-parameters for the first site.
87+
88+
``` julia
89+
i_site = 1
90+
θ1 = vcat(θsP, θsMs[i_site,:,:])
91+
θ1_nt = NamedTuple(k => CA.getdata(θ1[k,:]) for k in keys(θ1[:,1])) #
92+
plt = pairplot(θ1_nt)
93+
```
94+
95+
![](inspect_results_files/figure-commonmark/cell-9-output-1.png)
96+
97+
The plot shows that parameters for the first site, *K*₁ and *r*₁, are correlated,
98+
but that we did not model correlation with the global parameter, *K*₂.
99+
100+
Note that this plot shows only the first of the 800 sites.
101+
HVI estimated a 1602-dimensional posterior distribution including
102+
covariances among parameters.
103+
104+
### Expected values and marginal variances
105+
106+
Let's look at how the estimated uncertainty of a site parameter changes with
107+
its expected value.
108+
109+
``` julia
110+
par = :K1
111+
θmean = [mean(θsMs[s,par,:]) for s in axes(θsMs, 1)]
112+
θsd = [std(θsMs[s,par,:]) for s in axes(θsMs, 1)]
113+
fig = Figure(); ax = Axis(fig[1,1], xlabel="mean($par)",ylabel="sd($par)")
114+
scatter!(ax, θmean, θsd)
115+
fig
116+
```
117+
118+
![](inspect_results_files/figure-commonmark/cell-11-output-1.png)
119+
120+
We see that *K*₁ across sites ranges from about 0.18 to 0.25, and that
121+
its estimated uncertainty is about 0.034, slightly decreasing with the
122+
values of the parameter.
123+
124+
## Predictive Posterior
125+
126+
In addition to the uncertainty in parameters, we are also interested in
127+
the uncertainty of predictions, i.e. the predictive posterior.
128+
129+
We can either run the PBM for all the parameter samples that we obtained already,
130+
using [`apply_process_model`](@ref), or use [`predict_hvi`](@ref) which combines
131+
sampling the posterior and predictive posterior and returns the additional
132+
`NamedTuple` entry `y`.
133+
134+
``` julia
135+
(; y, θsP, θsMs) = predict_hvi(rng, probo; n_sample_pred)
136+
```
137+
138+
``` julia
139+
size(y)
140+
```
141+
142+
(8, 800, 400)
143+
144+
Again, the last dimension is the sample.
145+
The other dimensions correspond to the observations we provided for the fitting:
146+
The first dimension is the observation within one site, the second dimension is the site.
147+
148+
Let's look at how the uncertainty of the 4th observation scales with its
149+
predicted magnitude across sites.
150+
151+
``` julia
152+
i_obs = 4
153+
ymean = [mean(y[i_obs,s,:]) for s in axes(θsMs, 1)]
154+
ysd = [std(y[i_obs,s,:]) for s in axes(θsMs, 1)]
155+
fig = Figure(); ax = Axis(fig[1,1], xlabel="mean(y$i_obs)",ylabel="sd(y$i_obs)")
156+
scatter!(ax, ymean, ysd)
157+
fig
158+
```
159+
160+
![](inspect_results_files/figure-commonmark/cell-14-output-1.png)
161+
162+
We see that observed values for associated substrate concentrations range from about
163+
0.51 to 0.59 with an estimated standard deviation around 0.005 that decreases
164+
with the observed value.

0 commit comments

Comments
 (0)