diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 4876530..a50bb30 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -22,7 +22,7 @@ jobs:
         version:
           - 'lts'
           - '1'
-          # - 'pre' # TODO: tests on pre-release version
+          - 'pre'
     steps:
       - uses: actions/checkout@v4
       - uses: julia-actions/setup-julia@v2
diff --git a/Project.toml b/Project.toml
index b65b8dc..ef0e644 100644
--- a/Project.toml
+++ b/Project.toml
@@ -22,4 +22,4 @@ Reexport = "1"
 Statistics = "<0.0.1, 1"
 XAIBase = "4"
 Zygote = "0.6"
-julia = "1.6"
+julia = "1.10"
diff --git a/README.md b/README.md
index e383bfd..e08b9cd 100644
--- a/README.md
+++ b/README.md
@@ -16,7 +16,7 @@ and [iNNvestigate][innvestigate-repo] for Keras models.
 [^1]: More specifically, models currently have to be differentiable with [Zygote.jl](https://github.com/FluxML/Zygote.jl).
 
 ## Installation
-This package supports Julia ≥1.6. To install it, open the Julia REPL and run
+This package supports Julia ≥1.10. To install it, open the Julia REPL and run
 ```julia-repl
 julia> ]add ExplainableAI
 ```
diff --git a/benchmark/Project.toml b/benchmark/Project.toml
index 6bb7d4e..d2a943a 100644
--- a/benchmark/Project.toml
+++ b/benchmark/Project.toml
@@ -2,9 +2,8 @@
 BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
 ExplainableAI = "4f1bc3e1-d60d-4ed0-9367-9bdff9846d3b"
 Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
-LoopVectorization = "bdcacae8-1622-11e9-2a5c-532679323890"
 PkgBenchmark = "32113eaa-f34f-5b0d-bd6c-c81e245fc73d"
-Tullio = "bc48ee85-29a4-5162-ae0b-a64e1601d4bc"
+PkgJogger = "10150987-6cc1-4b76-abee-b1c1cbd91c01"
 
 [compat]
 BenchmarkTools = "1"
diff --git a/benchmark/bench_jogger.jl b/benchmark/bench_jogger.jl
new file mode 100644
index 0000000..e786975
--- /dev/null
+++ b/benchmark/bench_jogger.jl
@@ -0,0 +1,47 @@
+using BenchmarkTools
+using Flux
+using ExplainableAI
+
+on_CI = haskey(ENV, "GITHUB_ACTIONS")
+
+T = Float32
+input_size = (32, 32, 3, 1)
+input = rand(T, input_size)
+
+model = Chain(
+    Chain(
+        Conv((3, 3), 3 => 8, relu; pad=1),
+        Conv((3, 3), 8 => 8, relu; pad=1),
+        MaxPool((2, 2)),
+        Conv((3, 3), 8 => 16, relu; pad=1),
+        Conv((3, 3), 16 => 16, relu; pad=1),
+        MaxPool((2, 2)),
+    ),
+    Chain(
+        Flux.flatten,
+        Dense(1024 => 512, relu), # 524_800 parameters
+        Dropout(0.5),
+        Dense(512 => 100, relu),
+    ),
+)
+Flux.testmode!(model, true)
+
+# Use one representative algorithm of each type
+METHODS = Dict(
+    "Gradient" => Gradient,
+    "InputTimesGradient" => InputTimesGradient,
+    "SmoothGrad" => model -> SmoothGrad(model, 5),
+    "IntegratedGradients" => model -> IntegratedGradients(model, 5),
+)
+
+# Define benchmark
+construct(method, model) = method(model) # for use with @benchmarkable macro
+
+suite = BenchmarkGroup()
+suite["CNN"] = BenchmarkGroup([k for k in keys(METHODS)])
+for (name, method) in METHODS
+    analyzer = method(model)
+    suite["CNN"][name] = BenchmarkGroup(["constructor", "analyze"])
+    suite["CNN"][name]["constructor"] = @benchmarkable construct($(method), $(model))
+    suite["CNN"][name]["analyze"] = @benchmarkable analyze($(input), $(analyzer))
+end
diff --git a/benchmark/benchmarks.jl b/benchmark/benchmarks.jl
index a601058..37cdbf3 100644
--- a/benchmark/benchmarks.jl
+++ b/benchmark/benchmarks.jl
@@ -1,95 +1,5 @@
-using BenchmarkTools
-using LoopVectorization
-using Tullio
-using Flux
+using PkgJogger
 using ExplainableAI
-using ExplainableAI: lrp!, modify_layer
-
-on_CI = haskey(ENV, "GITHUB_ACTIONS")
-
-T = Float32
-input_size = (32, 32, 3, 1)
-input = rand(T, input_size)
-
-model = Chain(
-    Chain(
-        Conv((3, 3), 3 => 8, relu; pad=1),
-        Conv((3, 3), 8 => 8, relu; pad=1),
-        MaxPool((2, 2)),
-        Conv((3, 3), 8 => 16, relu; pad=1),
-        Conv((3, 3), 16 => 16, relu; pad=1),
-        MaxPool((2, 2)),
-    ),
-    Chain(
-        Flux.flatten,
-        Dense(1024 => 512, relu), # 102_764_544 parameters
-        Dropout(0.5),
-        Dense(512 => 100, relu),
-    ),
-)
-Flux.testmode!(model, true)
-
-# Use one representative algorithm of each type
-algs = Dict(
-    "Gradient" => Gradient,
-    "InputTimesGradient" => InputTimesGradient,
-    "LRP" => LRP,
-    "LREpsilonPlusFlat" => model -> LRP(model, EpsilonPlusFlat()),
-    "SmoothGrad" => model -> SmoothGrad(model, 5),
-    "IntegratedGradients" => model -> IntegratedGradients(model, 5),
-)
-
-# Define benchmark
-_alg(alg, model) = alg(model) # for use with @benchmarkable macro
-
-SUITE = BenchmarkGroup()
-SUITE["CNN"] = BenchmarkGroup([k for k in keys(algs)])
-for (name, alg) in algs
-    analyzer = alg(model)
-    SUITE["CNN"][name] = BenchmarkGroup(["construct analyzer", "analyze"])
-    SUITE["CNN"][name]["construct analyzer"] = @benchmarkable _alg($(alg), $(model))
-    SUITE["CNN"][name]["analyze"] = @benchmarkable analyze($(input), $(analyzer))
-end
-
-# generate input for conv layers
-insize = (32, 32, 3, 1)
-in_dense = 64
-out_dense = 10
-aᵏ = rand(T, insize)
-
-layers = Dict(
-    "Conv" => (Conv((3, 3), 3 => 2), aᵏ),
-    "Dense" => (Dense(in_dense, out_dense, relu), randn(T, in_dense, 1)),
-)
-rules = Dict(
-    "ZeroRule" => ZeroRule(),
-    "EpsilonRule" => EpsilonRule(),
-    "GammaRule" => GammaRule(),
-    "WSquareRule" => WSquareRule(),
-    "FlatRule" => FlatRule(),
-    "AlphaBetaRule" => AlphaBetaRule(),
-    "ZPlusRule" => ZPlusRule(),
-    "ZBoxRule" => ZBoxRule(zero(T), oneunit(T)),
-)
-
-layernames = String.(keys(layers))
-rulenames = String.(keys(rules))
-
-SUITE["modify layer"] = BenchmarkGroup(rulenames)
-SUITE["apply rule"] = BenchmarkGroup(rulenames)
-for rname in rulenames
-    SUITE["modify layer"][rname] = BenchmarkGroup(layernames)
-    SUITE["apply rule"][rname] = BenchmarkGroup(layernames)
-end
-
-for (lname, (layer, aᵏ)) in layers
-    Rᵏ = similar(aᵏ)
-    Rᵏ⁺¹ = layer(aᵏ)
-    for (rname, rule) in rules
-        modified_layer = modify_layer(rule, layer)
-        SUITE["modify layer"][rname][lname] = @benchmarkable modify_layer($(rule), $(layer))
-        SUITE["apply rule"][rname][lname] = @benchmarkable lrp!(
-            $(Rᵏ), $(rule), $(layer), $(modified_layer), $(aᵏ), $(Rᵏ⁺¹)
-        )
-    end
-end
+# Use PkgJogger.@jog to create the JogExplainableAI module
+@jog ExplainableAI
+SUITE = JogExplainableAI.suite()
diff --git a/src/ExplainableAI.jl b/src/ExplainableAI.jl
index f999b15..567971f 100644
--- a/src/ExplainableAI.jl
+++ b/src/ExplainableAI.jl
@@ -14,7 +14,6 @@ using DifferentiationInterface: value_and_pullback
 using Zygote
 const DEFAULT_AD_BACKEND = AutoZygote()
 
-include("compat.jl")
 include("bibliography.jl")
 include("input_augmentation.jl")
 include("gradient.jl")
diff --git a/src/compat.jl b/src/compat.jl
deleted file mode 100644
index aa98e07..0000000
--- a/src/compat.jl
+++ /dev/null
@@ -1,12 +0,0 @@
-# https://github.com/JuliaLang/julia/pull/39794
-if VERSION < v"1.7.0-DEV.793"
-    export Returns
-
-    struct Returns{V} <: Function
-        value::V
-        Returns{V}(value) where {V} = new{V}(value)
-        Returns(value) = new{Core.Typeof(value)}(value)
-    end
-
-    (obj::Returns)(args...; kw...) = obj.value
-end
diff --git a/test/Project.toml b/test/Project.toml
index 48d2ec4..a616a45 100644
--- a/test/Project.toml
+++ b/test/Project.toml
@@ -1,13 +1,15 @@
 [deps]
 Aqua = "4c88cf16-eb10-579e-8560-4a9242c79595"
+BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
 Distributions = "31c24e10-a181-5473-b8eb-7969acd0382f"
 Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
 JET = "c3a54625-cd67-489e-a8e7-0a5a0ff4e31b"
 JLD2 = "033835bb-8acc-5ee8-8aae-3f567f8a3819"
 JuliaFormatter = "98e50ef6-434e-11e9-1051-2b60c6c9e899"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
+PkgJogger = "10150987-6cc1-4b76-abee-b1c1cbd91c01"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 ReferenceTests = "324d217c-45ce-50fc-942e-d289b448e8cf"
-Suppressor = "fd094767-a336-5f1f-9728-57cf17d0bbfb"
+StableRNGs = "860ef19b-820b-49d6-a774-d7a799459cd3"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
 XAIBase = "9b48221d-a747-4c1b-9860-46a1d8ba24a7"
diff --git a/test/references/cnn/GradCAM_max.jld2 b/test/references/cnn/GradCAM_max.jld2
index 5031171..944423b 100644
Binary files a/test/references/cnn/GradCAM_max.jld2 and b/test/references/cnn/GradCAM_max.jld2 differ
diff --git a/test/references/cnn/Gradient_max.jld2 b/test/references/cnn/Gradient_max.jld2
index 8b774c4..8818624 100644
Binary files a/test/references/cnn/Gradient_max.jld2 and b/test/references/cnn/Gradient_max.jld2 differ
diff --git a/test/references/cnn/InputTimesGradient_max.jld2 b/test/references/cnn/InputTimesGradient_max.jld2
index dd54f3d..0951dea 100644
Binary files a/test/references/cnn/InputTimesGradient_max.jld2 and b/test/references/cnn/InputTimesGradient_max.jld2 differ
diff --git a/test/references/cnn/IntegratedGradients_max.jld2 b/test/references/cnn/IntegratedGradients_max.jld2
index 01b02f2..f78ec5a 100644
Binary files a/test/references/cnn/IntegratedGradients_max.jld2 and b/test/references/cnn/IntegratedGradients_max.jld2 differ
diff --git a/test/references/cnn/SmoothGrad_max.jld2 b/test/references/cnn/SmoothGrad_max.jld2
index 89c9f15..f0676f8 100644
Binary files a/test/references/cnn/SmoothGrad_max.jld2 and b/test/references/cnn/SmoothGrad_max.jld2 differ
diff --git a/test/runtests.jl b/test/runtests.jl
index e73db4d..8bd5819 100644
--- a/test/runtests.jl
+++ b/test/runtests.jl
@@ -6,14 +6,13 @@ using Aqua
 using JET
 
 @testset "ExplainableAI.jl" begin
-    if VERSION >= v"1.10"
-        @info "Testing formalities..."
+    @testset verbose = true "Linting" begin
         @testset "Code formatting" begin
             @info "- running JuliaFormatter code formatting tests..."
             @test JuliaFormatter.format(ExplainableAI; verbose=false, overwrite=false)
         end
         @testset "Aqua.jl" begin
-            @info "- running Aqua.jl tests. These might print warnings from dependencies..."
+            @info "- running Aqua.jl tests..."
             Aqua.test_all(ExplainableAI; ambiguities=false)
         end
         @testset "JET tests" begin
@@ -34,4 +33,8 @@
         @info "Testing analyzers on batches..."
         include("test_batches.jl")
     end
+    @testset "Benchmark correctness" begin
+        @info "Testing whether benchmarks are up-to-date..."
+        include("test_benchmarks.jl")
+    end
 end
diff --git a/test/test_batches.jl b/test/test_batches.jl
index 473073d..832d86e 100644
--- a/test/test_batches.jl
+++ b/test/test_batches.jl
@@ -3,9 +3,10 @@ using Test
 
 using Flux
 using Random
+using StableRNGs: StableRNG
 using Distributions: Laplace
 
-pseudorand(dims...) = rand(MersenneTwister(123), Float32, dims...)
+pseudorand(dims...) = rand(StableRNG(123), Float32, dims...)
 
 ## Test `fuse_batchnorm` on Dense and Conv layers
 ins = 20
@@ -15,16 +16,16 @@ batchsize = 15
 model = Chain(Dense(ins, 15, relu; init=pseudorand), Dense(15, outs, relu; init=pseudorand))
 
 # Input 1 with batch dimension
-input1 = rand(MersenneTwister(1), Float32, ins, 1)
+input1 = rand(StableRNG(1), Float32, ins, 1)
 # Input 2 with batch dimension
-input2 = rand(MersenneTwister(2), Float32, ins, 1)
+input2 = rand(StableRNG(2), Float32, ins, 1)
 # Batch containing inputs 1 & 2
 input_batch = cat(input1, input2; dims=2)
 
 ANALYZERS = Dict(
     "Gradient" => Gradient,
     "InputTimesGradient" => InputTimesGradient,
-    "SmoothGrad" => m -> SmoothGrad(m, 5, 0.1, MersenneTwister(123)),
+    "SmoothGrad" => m -> SmoothGrad(m, 5, 0.1, StableRNG(123)),
     "IntegratedGradients" => m -> IntegratedGradients(m, 5),
     "GradCAM" => m -> GradCAM(m[1], m[2]),
 )
diff --git a/test/test_benchmarks.jl b/test/test_benchmarks.jl
new file mode 100644
index 0000000..45ee42e
--- /dev/null
+++ b/test/test_benchmarks.jl
@@ -0,0 +1,4 @@
+using PkgJogger
+using ExplainableAI
+
+PkgJogger.@test_benchmarks ExplainableAI
diff --git a/test/test_cnn.jl b/test/test_cnn.jl
index 6e7f6a8..b8ff8f3 100644
--- a/test/test_cnn.jl
+++ b/test/test_cnn.jl
@@ -4,21 +4,22 @@
 using ReferenceTests
 using Flux
 using Random
+using StableRNGs: StableRNG
 using JLD2
 
 const GRADIENT_ANALYZERS = Dict(
     "InputTimesGradient" => InputTimesGradient,
-    "SmoothGrad" => m -> SmoothGrad(m, 5, 0.1, MersenneTwister(123)),
+    "SmoothGrad" => m -> SmoothGrad(m, 5, 0.1, StableRNG(123)),
     "IntegratedGradients" => m -> IntegratedGradients(m, 5),
     "GradCAM" => m -> GradCAM(m[1], m[2]),
 )
 
-pseudorand(dims...) = rand(MersenneTwister(123), Float32, dims...)
+pseudorand(dims...) = rand(StableRNG(123), Float32, dims...)
 
 input_size = (32, 32, 3, 1)
 input = pseudorand(input_size)
 
-init(dims...) = Flux.glorot_uniform(MersenneTwister(123), dims...)
+init(dims...) = Flux.glorot_uniform(StableRNG(123), dims...)
 
 model = Chain(
     Chain(
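
A minimal sketch of running the new benchmark setup locally, assuming PkgJogger's documented `@jog`/`benchmark()`/`save_benchmarks` workflow (the `results` and `filename` bindings below are illustrative, not part of this patch):

```julia
using PkgJogger
using ExplainableAI

# @jog generates a JogExplainableAI module wrapping the suites
# defined in benchmark/bench_*.jl (here: bench_jogger.jl)
@jog ExplainableAI

results = JogExplainableAI.benchmark()                # run the full suite
filename = JogExplainableAI.save_benchmarks(results)  # archive results for later comparison
```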