update GPU exercise

vchuravy · vchuravy · commit 6ab868b0b178 · 2025-09-17T08:12:58.000+02:00
diff --git a/exercise_03_intro_accelerated.jl b/exercise_03_intro_accelerated.jl
@@ -42,6 +42,9 @@ begin
 	using CairoMakie
 end
 
+# ╔═╡ 1b9844e2-2e2b-47c2-8a5e-3ff3dbfacc16
+using OrdinaryDiffEqTsit5
+
 # ╔═╡ 3e5c3c97-4401-41d4-a701-d9b24f9acdc6
 PlutoUI.TableOfContents(; depth=4)
 
@@ -214,7 +217,7 @@ begin
 end
 
 # ╔═╡ 0ad45abb-0d9f-4e8d-b097-b0b42ba024f7
-dt = dx^2 * dy^2 / (2.0 * a * (dx^2 + dy^2)) # Largest stable time step
+t_final = 3.0
 
 # ╔═╡ 83042a1e-f964-483d-b316-a486cfabd7e0
 N = 64
@@ -234,28 +237,32 @@ $dU = a * dt * (\frac{U[i+1, j] - 2U[i,j] + U[i-1,j]}{dx^2} + \frac{U[i, j+1] -
 """
 
 # ╔═╡ 9eb166fa-360e-4a5d-a2ac-9113c2f264b3
-@kernel function diffuse(dU, @Const(U), a, dt, dx, dy)
+@kernel function heat_2D_kernel!(du, @Const(u), a, dx, dy)
 	# implement me
 end
 
 # ╔═╡ aa2d455e-c9fc-4a7b-b50e-77709481c2a7
-function diffuse!(U, a, dt, dx, dy)
-    dU = zero(U)
-	diffuse(get_backend(U))(dU, U, a, dt, dx, dy; ndrange=(N,N))
-	U .+= dU
+function heat_2D!(du, u, (a, dx, dy), t)
+	# ODE right-hand side: refresh the halo cells of `u`, then launch `heat_2D_kernel!`
+	# over the N×M interior. Assumes `u` is indexed 0:N+1 × 0:M+1, as `u₀` is built.
+	N, M = size(u) .- 2  # interior extent, excluding one halo cell per side
+	
+	# update boundary condition (wrap around): each halo takes the opposite interior edge
+	u[0, :]   .= u[N, :]
+	u[N+1, :] .= u[1, :]
+	u[:, 0]   .= u[:, M]
+	u[:, M+1] .= u[:, 1]
 	
-    # update boundary condition (wrap around)
-    U[0, :]   .= U[N, :]
-    U[N+1, :] .= U[1, :]
-    U[:, 0]   .= U[:, N]
-    U[:, N+1] .= U[:, 0]
-    U
+	kernel = heat_2D_kernel!(get_backend(du))
+	kernel(du, u, a, dx, dy; ndrange=(N,M))
+
+	return nothing
 end
 
 # ╔═╡ f912ee44-15ed-469f-b417-cf7d8d87146e
 answer_box(hint(md"""
 ```julia
-@kernel function diffuse(dU, @Const(U), a, dt, dx, dy)
+@kernel function heat_2D_kernel!(du, @Const(u), a, dx, dy)
 	i, j = @index(Global, NTuple)
 	out[i, j] = a * dt * (
 		(U[i + 1, j] - 2 * U[i, j] + U[i - 1, j]) / dx^2 +
@@ -265,24 +272,55 @@ end
 ```
 """))
 
-# ╔═╡ 2a986721-f513-488d-970e-4797f0de135f
-let
+# ╔═╡ 7147bba2-78ae-49fa-ae35-2c815ee188ae
+begin
 	xs = 0:(N+1)
 	ys = 0:(N+1)
-	domain = OffsetArray(
-		KernelAbstractions.zeros(backend, Float32, N+2, N+2),
-		xs, ys)
-	# TODO: Split out into initalize function
-	parent(domain)[16:32, 16:32] .= 5
-	
-	fig, ax, hm = heatmap(xs, ys, Array(parent(domain)))
+	# Initial state: (N+2)×(N+2) zeros on `backend`, indexed 0:N+1 in both dimensions.
+	u₀ = OffsetArray(
+		KernelAbstractions.zeros(
+			backend, Float32, N+2, N+2)
+		, xs, ys)
+	parent(u₀)[16:32, 16:32] .= 5
+	# Convert to a plain `Array` before plotting, as the animation cell does.
+	heatmap(xs, ys, Array(parent(u₀)))
+end
+
+# ╔═╡ cdf61aff-ec98-4174-9d48-c287977742cb
+prob = ODEProblem(heat_2D!, u₀, (0.0, t_final), (a, dx, dy))
+
+# ╔═╡ 8e963ae6-06fd-47fc-a1de-e884468de234
+sol = solve(prob, Tsit5(), saveat=0.2);
+
+# ╔═╡ 78f7884c-3523-4d96-9dfc-fbe9de36a86b
+let
+	frame = Observable(1)  # index of the saved solution state currently shown
+	snapshot = @lift Array(parent(sol.u[$frame]))  # re-evaluated when `frame` changes
+	fig, ax, hm = heatmap(xs, ys, snapshot)
 	
-	Makie.Record(fig, 1:250) do i
-	    diffuse!(domain, a, dt, dx, dy)  # update data
-	    autolimits!(ax) # update limits
+	Makie.Record(fig, eachindex(sol.u), framerate=5) do i
+	    frame[] = i  # one recorded frame per saved state
 	end
 end
 
+# ╔═╡ 2a986721-f513-488d-970e-4797f0de135f
+# let
+# 	xs = 0:(N+1)
+# 	ys = 0:(N+1)
+# 	domain = OffsetArray(
+# 		KernelAbstractions.zeros(backend, Float32, N+2, N+2),
+# 		xs, ys)
+# 	# TODO: Split out into initalize function
+# 	parent(domain)[16:32, 16:32] .= 5
+	
+# 	fig, ax, hm = heatmap(xs, ys, Array(parent(domain)))
+	
+# 	Makie.Record(fig, 1:250) do i
+# 	    diffuse!(domain, a, dt, dx, dy)  # update data
+# 	    autolimits!(ax) # update limits
+# 	end
+# end
+
 # ╔═╡ 00000000-0000-0000-0000-000000000001
 PLUTO_PROJECT_TOML_CONTENTS = """
 [deps]
@@ -314,7 +352,7 @@ oneAPI = "~2.0.3"
 PLUTO_MANIFEST_TOML_CONTENTS = """
 # This file is machine-generated - editing it directly is not advised
 
-julia_version = "1.11.5"
+julia_version = "1.11.6"
 manifest_format = "2.0"
 project_hash = "81e4ea397ec4528af2733db8b8dce3926ca44ef1"
 
@@ -2314,13 +2352,18 @@ version = "3.6.0+0"
 # ╠═fc859cea-a41a-4d96-bf86-5a23bca19589
 # ╟─1c76d376-ef91-4410-a981-d8a6dea3033f
 # ╠═f7829706-3981-45b5-bdc3-d8b21155229a
+# ╠═1b9844e2-2e2b-47c2-8a5e-3ff3dbfacc16
 # ╠═0b20861c-995c-4890-81b9-98b8aca5095a
 # ╠═0ad45abb-0d9f-4e8d-b097-b0b42ba024f7
 # ╠═83042a1e-f964-483d-b316-a486cfabd7e0
 # ╟─d2d925a0-8fd5-4345-8ee2-fa4dc4a75407
 # ╠═9eb166fa-360e-4a5d-a2ac-9113c2f264b3
 # ╠═aa2d455e-c9fc-4a7b-b50e-77709481c2a7
 # ╟─f912ee44-15ed-469f-b417-cf7d8d87146e
+# ╠═7147bba2-78ae-49fa-ae35-2c815ee188ae
+# ╠═cdf61aff-ec98-4174-9d48-c287977742cb
+# ╠═8e963ae6-06fd-47fc-a1de-e884468de234
+# ╠═78f7884c-3523-4d96-9dfc-fbe9de36a86b
 # ╠═2a986721-f513-488d-970e-4797f0de135f
 # ╟─00000000-0000-0000-0000-000000000001
 # ╟─00000000-0000-0000-0000-000000000002
diff --git a/lecture_04_interop.jl b/lecture_04_interop.jl
@@ -42,6 +42,9 @@ using CondaPkg; CondaPkg.add("seaborn")
 # ╔═╡ 1a7f20f9-a69c-49a2-a012-ed59657cc29f
 using PythonCall, RDatasets
 
+# ╔═╡ e036e0b1-60f5-4670-9956-15e74d010ee9
+using MPI, Serialization, StaticArrays
+
 # ╔═╡ 0e88ed74-261d-4aad-82dc-ed8076684406
 using Measurements
 
@@ -200,6 +203,22 @@ macro mpi(np, expr)
 	end
 end
 
+# ╔═╡ fa98c58b-e61b-4762-a89f-58cf6b5a50d0
+@mpi np let
+	using StaticArrays
+	
+	MPI.Init()
+	comm = MPI.COMM_WORLD
+
+	x = ones(SVector{3, Float64})
+	sum = MPI.Allreduce([x], +, comm)
+
+	if MPI.Comm_rank(comm) == 0
+		@show sum
+	end
+	nothing
+end
+
 # ╔═╡ c739f61d-7104-4ae4-9934-fc98657fc2fc
 md"""
 Compute $\int_0^1 \frac{4}{1+x^2} dx = [4 * atan(x)]_0^1$ which evaluates to π
@@ -514,25 +533,6 @@ md"""
 - [2025 RSE Course](https://vchuravy.dev/rse-course)
 """
 
-# ╔═╡ fa98c58b-e61b-4762-a89f-58cf6b5a50d0
-@mpi np let
-	using StaticArrays
-	
-	MPI.Init()
-	comm = MPI.COMM_WORLD
-
-	x = ones(SVector{3, Float64})
-	sum = MPI.Allreduce([x], +, comm)
-
-	if MPI.Comm_rank(comm) == 0
-		@show sum
-	end
-	nothing
-end
-
-# ╔═╡ e036e0b1-60f5-4670-9956-15e74d010ee9
-using MPI, Serialization, StaticArrays
-
 # ╔═╡ 00000000-0000-0000-0000-000000000001
 PLUTO_PROJECT_TOML_CONTENTS = """
 [deps]