Update 1D heateq example #102

New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Open
bgroenks96 wants to merge 4 commits into ODINN-SciML:main from bgroenks96:update-heateq-example
code/SolverMethods/1DHeatEquation_with_Phase_Change.jl
            
                      Original file line number
                      Diff line number
                      Diff line change
                  
    @@ -1,3 +1,4 @@
  
    using BenchmarkTools

    using ComponentArrays

    using FreezeCurves

    using LinearAlgebra

    @@ -12,14 +13,14 @@ import Plots
  
    const L = 3.34e8 # volumetric latent heat of fusion of water [J/m^3]

    const default_p = ComponentVector(

        θwi=0.5,  # total water+ice content; 1.0 would correspond to a block of pure ice/water

        θwi=0.3,  # total water+ice content; 1.0 would correspond to a block of pure ice/water

        k_s=2.5,  # thermal conductivity of solid material [W/(m.K)]

        k_w=0.57, # thermal conductivity of unfrozen water [W/(m.K)]

        k_i=2.2,  # thermal conductivity of ice [W/(m.K)]

        c_s=2.5e6, # heat capacity of solid material [J/(m^3.K)]

        c_w=4.2e6, # heat capacity of unfrozen water [J/(m^3.K)]

        c_i=1.9e6, # heat capacity of ice [J/(m^3.K)]

        jH_lb=0.05, # lower boundary flux [W/m^2]

        jH_lb=0.1, # lower boundary flux [W/m^2]

    )

    struct Grid1D{TA}

    @@ -73,6 +74,7 @@ function enthalpyinv(H, p)
  
                zero(T_f)

            )

        )

        return T, θw

    end

    function heateq_with_phase_change(

    @@ -85,10 +87,11 @@ function heateq_with_phase_change(
  
            T = map(first, Hinv_res)

            θw = map(last, Hinv_res)

            θwi = p.θwi

            k = (1-θwi)*p.k_s .+ θw*p.k_w .+ (1.0.-θw)*p.k_i

            jH = k[1:end-1].*(T[1:end-1] .- T[2:end]) ./ grid.dists

            kc = (1-θwi)*p.k_s .+ θw*p.k_w .+ (1.0.-θw)*p.k_i

            k = (kc[1:end-1] .+ kc[2:end])./2

            jH = k.*(T[1:end-1] .- T[2:end]) ./ grid.dists

            jH_lb = p.jH_lb

            jH_ub = -2*(T[1] - T_ub(u,p,t)) / grid.thick[1]

            jH_ub = 2*(T_ub(u,p,t) - T[1]) / grid.thick[1]

            dH = vcat(

                (jH_ub - jH[1]) / grid.thick[1],

                (jH[1:end-1] .- jH[2:end]) ./ grid.thick[2:end-1],

    @@ -100,26 +103,137 @@ function heateq_with_phase_change(
  
    end

    # upper boundary temperature

    T_ub(u,p,t) = 10*sin(2π*t/(24*3600))

    T_ub(u,p,t) = 10*sin(2π*t/(24*3600)) - 1.0

    p = default_p

    grid_edges = vcat(0.0:0.05:5.0, 5.1:0.1:20.0, 20.5:0.5:50.0, 51.0:1.0:100.0)

    grid_edges = vcat(0.0:0.05:5.0, 5.1:0.1:10)

    # grid_edges = vcat(0.0:0.05:1.0, 1.1:0.1:10.0)

    grid = Grid1D(grid_edges)

    T0, H0 = steady_state_init(grid, p; Tsurf=-10.0)

    f = heateq_with_phase_change(grid, T_ub)

    jac_prototype = Tridiagonal(ones(length(H0)-1), ones(length(H0)), ones(length(H0)-1))

    tspan = (0.0, 48*3600.0)

    tspan = (0.0, 30*24*3600.0)

    prob = ODEProblem(ODEFunction(f; jac_prototype), H0, tspan, p)

    sol = @time solve(prob, SSPRK43(), abstol=1e-2, reltol=1e-6)

    H_sol = reduce(hcat, sol.u)

    T_sol = enthalpyinv.(H_sol, Ref(p))

    Plots.plot(T_sol[1:5:50,:]', leg=nothing)

    T_sol = first.(enthalpyinv.(H_sol, Ref(p)))

    Plots.plot(T_sol', leg=nothing)

    Plots.heatmap(sol.t./3600.0, grid.cells, T_sol, yflip=true)

    function loss(p)

        sensealg = sensealg=InterpolatingAdjoint(autojacvec=EnzymeVJP(), checkpointing=true)

        sol_p = solve(prob, SSPRK43(); p, sensealg)

        return mean(sol_p.u[end])/L

    """
        buildalg(algType; autojacvec, checkpointing, kwargs...)

    Construct an adjoint sensitivity algorithm of the requested type from keyword options.

    The `InterpolatingAdjoint`, `GaussAdjoint` and `BacksolveAdjoint` methods forward both
    `autojacvec` and `checkpointing` to the constructor; the `QuadratureAdjoint` method
    forwards only `autojacvec`. Any additional keyword arguments are accepted and ignored.
    """
    function buildalg(::Type{InterpolatingAdjoint}; autojacvec, checkpointing, kwargs...)
        return InterpolatingAdjoint(; autojacvec=autojacvec, checkpointing=checkpointing)
    end

    function buildalg(::Type{GaussAdjoint}; autojacvec, checkpointing, kwargs...)
        return GaussAdjoint(; autojacvec=autojacvec, checkpointing=checkpointing)
    end

    function buildalg(::Type{BacksolveAdjoint}; autojacvec, checkpointing, kwargs...)
        return BacksolveAdjoint(; autojacvec=autojacvec, checkpointing=checkpointing)
    end

    # this method does not require `checkpointing`; if supplied it is absorbed by `kwargs`
    function buildalg(::Type{QuadratureAdjoint}; autojacvec, kwargs...)
        return QuadratureAdjoint(; autojacvec=autojacvec)
    end

    """
        benchmark_sensealg(algType, tspan_end, p; saveat=nothing, dealg=SSPRK43(), sensealg_kwargs...)

    Benchmark `adjoint_sensitivities` for one sensitivity algorithm configuration.

    The global `prob` is remade with parameters `p` and time span `(0.0, tspan_end)` and
    solved forward with `dealg`; `saveat` is passed to `solve` only when it is not `nothing`.
    The adjoint computation on that solution is then measured with `@benchmark`, using the
    sensitivity algorithm built by `buildalg(algType; sensealg_kwargs...)`.

    Returns a `NamedTuple` with the fields `t`, `allocs`, `memory`, `runtime_mean`,
    `runtime_mid` (median), `runtime_std` and `alg` (the algorithm type as a string),
    followed by the entries of `sensealg_kwargs`.
    """
    function benchmark_sensealg(
        ::Type{algType}, tspan_end, p;
        saveat=nothing, dealg=SSPRK43(), sensealg_kwargs...
    ) where {algType}
        adjalg = buildalg(algType; sensealg_kwargs...)
        fwdprob = remake(prob; p=p, tspan=(0.0, tspan_end))
        sol = isnothing(saveat) ? solve(fwdprob, dealg) : solve(fwdprob, dealg; saveat)
        # the forward solve must have succeeded and stopped exactly at `tspan_end`
        @assert sol.retcode == ReturnCode.Success
        @assert sol.t[end] == tspan_end
        # passed as `dgdu_discrete`; writes `u .- 1.0` in-place into `out`
        dgdu(out, u, p, t, i) = (out .= u .- 1.0)
        trial = @benchmark adjoint_sensitivities(
            $sol,
            $dealg;
            sensealg=$adjalg,
            t=[$sol.t[end]],
            dgdu_discrete=$dgdu,
            abstol=1e-10,
            reltol=1e-10,
        )
        samples = trial.times
        return (
            t=tspan_end,
            allocs=trial.allocs,
            memory=trial.memory,
            runtime_mean=mean(samples),
            runtime_mid=median(samples),
            runtime_std=std(samples),
            alg=string(algType),
            sensealg_kwargs...
        )
    end

    # Simple tests: one-off benchmarks over a 24 h time span (24*3600 s) with the
    # forward solution saved every 3600 s.

    # InterpolatingAdjoint with Enzyme VJP, with and without checkpointing.
    # NOTE(review): "chckpointing" in the first variable name looks like a typo for
    # "checkpointing" — confirm nothing else refers to it before renaming.

    res_ia_with_chckpointing = benchmark_sensealg(InterpolatingAdjoint, 24*3600.0, p; autojacvec=EnzymeVJP(), checkpointing=true, saveat=3600.0)

    res_ia_without_checkpointing = benchmark_sensealg(InterpolatingAdjoint, 24*3600.0, p; autojacvec=EnzymeVJP(), checkpointing=false, saveat=3600.0)

    # QuadratureAdjoint with Enzyme VJP

    res_qa_enzyme = benchmark_sensealg(QuadratureAdjoint, 24*3600.0, p; autojacvec=EnzymeVJP(), saveat=3600.0)

    # Zygote VJP appears to be several orders of magnitude slower than Enzyme.

    res_qa_zygote = benchmark_sensealg(QuadratureAdjoint, 24*3600.0, p; autojacvec=ZygoteVJP(), saveat=3600.0)

    # Forward-mode VJP (autojacvec=true) is about 1-2 orders of magnitude slower.

    res_qa_forward = benchmark_sensealg(QuadratureAdjoint, 24*3600.0, p; autojacvec=true, saveat=3600.0)

    # ReverseDiffVJP does not work; it fails with a weird internal error:

    # ERROR: MethodError: no method matching increment_deriv!(::Float64, ::Float64)

    # res_qa_reverse = benchmark_sensealg(QuadratureAdjoint, 24*3600.0, p; autojacvec=ReverseDiffVJP(), saveat=3600.0)

    configs = [

        (InterpolatingAdjoint, (autojacvec=EnzymeVJP(), checkpointing=false)),

        (InterpolatingAdjoint, (autojacvec=EnzymeVJP(), checkpointing=true)),

        (GaussAdjoint, (autojacvec=EnzymeVJP(), checkpointing=false)),

        (GaussAdjoint, (autojacvec=EnzymeVJP(), checkpointing=true)),

        (QuadratureAdjoint, (autojacvec=EnzymeVJP(), checkpointing=false)),

        # backsolve appears to fail for longer integration periods

        # (BacksolveAdjoint, (autojacvec=EnzymeVJP(), checkpointing=true)),

    ]

    # target simulation time periods ranging from 1 minute to roughly 1 year (12 x 30 days = 360 days)

    tspans = [60.0, 3600.0, 24*3600.0, 30*24*3600.0, 12*30*24*3600.0]

    # lossfunc = buildloss(prob, InterpolatingAdjoint(autojacvec=EnzymeVJP()), tspan=(0.0,24*3600.0))

    # Zygote.gradient(lossfunc, p)

    # Run every sensitivity-algorithm configuration for every target time span and
    # collect one benchmark record per (tspan, config) pair.
    results = []
    for t in tspans, c in configs
        algtype, kwargs = c
        @info "Running benchmark for $algtype with $kwargs and tspan of $t sec."
        # Checkpointed runs save the forward solution at one tenth of the time span,
        # capped at one hour; all other runs leave `saveat` at `nothing`, which is
        # the default of `benchmark_sensealg` and therefore the same as omitting it.
        saveat = get(kwargs, :checkpointing, false) ? min(t/10.0, 3600.0) : nothing
        push!(results, benchmark_sensealg(algtype, t, p; saveat, kwargs...))
    end

    grad = @time Zygote.gradient(loss, p)

    using DataFrames

    results_df = DataFrame(results)

    show(stdout, "text/plain", results_df)

    """
        matchesconfig(config, row)

    Return `true` if `row` was produced by the benchmark configuration `config`.

    `config` is an `(algorithm, options)` pair. The row matches when `row.alg` equals
    `string(algorithm)` and its `autojacvec` and `checkpointing` fields equal the
    corresponding entries of `options`.
    """
    function matchesconfig(config, row)
        algtype, opts = config
        # guard clauses, checked in order: algorithm name, VJP choice, checkpointing flag
        row.alg == string(algtype) || return false
        opts.autojacvec == row.autojacvec || return false
        return opts.checkpointing == row.checkpointing
    end

    # Plot memory versus simulation time span on log-log axes, one series per entry of
    # `configs`. `t` is divided by 60 and `memory` by 1024 to match the axis labels
    # (minutes and KiB). The first `Plots.plot` call creates the figure; the `plot!`
    # calls add further series to it.

    df1 = filter(row -> matchesconfig(configs[1], row), results_df)

    Plots.plot(df1.t./60.0, df1.memory./1024, marker=:dot, label="InterpolatingAdjoint", xscale=:log10, yscale=:log10, xlabel="Simulation tspan / min", ylabel="Memory / KiB", leg=:topleft)

    df2 = filter(row -> matchesconfig(configs[2], row), results_df)

    Plots.plot!(df2.t./60.0, df2.memory./1024, marker=:dot, label="InterpolatingAdjoint w/ checkpointing")

    df3 = filter(row -> matchesconfig(configs[3], row), results_df)

    Plots.plot!(df3.t./60.0, df3.memory./1024, marker=:dot, label="GaussAdjoint")

    df4 = filter(row -> matchesconfig(configs[4], row), results_df)

    Plots.plot!(df4.t./60.0, df4.memory./1024, marker=:dot, label="GaussAdjoint w/ checkpointing")

    df5 = filter(row -> matchesconfig(configs[5], row), results_df)

    Plots.plot!(df5.t./60.0, df5.memory./1024, marker=:dot, label="QuadratureAdjoint")

    # Disabled: `configs` currently has only five active entries, so there is no configs[6].

    # df6 = filter(row -> matchesconfig(configs[6], row), results_df)

    # Plots.plot!(df6.t./60.0, df6.memory./1024, marker=:dot, label="QuadratureAdjoint w/ ForwardDiff VJP")

    # NOTE(review): assumes the `plots/` directory already exists — confirm.

    Plots.savefig("plots/heateq1D_memory_vs_simulation_tspan.png")

    # Plot the median runtime (`runtime_mid`) versus simulation time span on log-log axes,
    # one series per entry of `configs`. `t` is divided by 60 for the minutes axis and
    # `runtime_mid` by 1e9 for the axis labelled in seconds (presumably the recorded
    # times are in nanoseconds — confirm against BenchmarkTools).
    # NOTE(review): df1..df5 are filtered here with the same expressions used for the
    # memory plot, so these assignments may be redundant.

    df1 = filter(row -> matchesconfig(configs[1], row), results_df)

    Plots.plot(df1.t./60.0, df1.runtime_mid./1e9, marker=:dot, label="InterpolatingAdjoint", xscale=:log10, yscale=:log10, xlabel="Simulation tspan / min", ylabel="Wallclock runtime / s", leg=:topleft)

    df2 = filter(row -> matchesconfig(configs[2], row), results_df)

    Plots.plot!(df2.t./60.0, df2.runtime_mid./1e9, marker=:dot, label="InterpolatingAdjoint w/ checkpointing")

    df3 = filter(row -> matchesconfig(configs[3], row), results_df)

    Plots.plot!(df3.t./60.0, df3.runtime_mid./1e9, marker=:dot, label="GaussAdjoint")

    df4 = filter(row -> matchesconfig(configs[4], row), results_df)

    Plots.plot!(df4.t./60.0, df4.runtime_mid./1e9, marker=:dot, label="GaussAdjoint w/ checkpointing")

    df5 = filter(row -> matchesconfig(configs[5], row), results_df)

    Plots.plot!(df5.t./60.0, df5.runtime_mid./1e9, marker=:dot, label="QuadratureAdjoint")

    # Disabled: `configs` currently has only five active entries, so there is no configs[6].

    # df6 = filter(row -> matchesconfig(configs[6], row), results_df)

    # Plots.plot!(df6.t./60.0, df6.runtime_mid./1e9, marker=:dot, label="QuadratureAdjoint w/ ForwardDiff VJP")

    # NOTE(review): assumes the `plots/` directory already exists — confirm.

    Plots.savefig("plots/heateq1D_runtime_vs_simulation_tspan.png")
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Update 1D heateq example #102

Uh oh!

Diff view

Diff view

There are no files selected for viewing

Update 1D heateq example #102

Are you sure you want to change the base?

Uh oh!

Update 1D heateq example #102

Uh oh!

Uh oh!

Diff view

Diff view

There are no files selected for viewing