trixi-framework
diff --git a/‎benchmarks/benchmarks.jl‎
Lines changed: 1 addition & 1 deletion b/‎benchmarks/benchmarks.jl‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/count_neighbors.jl‎
Lines changed: 2 additions & 1 deletion b/‎benchmarks/count_neighbors.jl‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎benchmarks/n_body.jl‎
Lines changed: 2 additions & 2 deletions b/‎benchmarks/n_body.jl‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎benchmarks/plot.jl‎
Lines changed: 0 additions & 86 deletions b/‎benchmarks/plot.jl‎
Lines changed: 0 additions & 86 deletions
diff --git a/‎benchmarks/run_benchmarks.jl‎
Lines changed: 228 additions & 0 deletions b/‎benchmarks/run_benchmarks.jl‎
Lines changed: 228 additions & 0 deletions
@@ -3,4 +3,4 @@ include("n_body.jl")
 include("smoothed_particle_hydrodynamics.jl")
 include("update.jl")
 
-include("plot.jl")
+include("run_benchmarks.jl")
@@ -2,7 +2,8 @@ using PointNeighbors
 using BenchmarkTools
 
 """
-    benchmark_count_neighbors(neighborhood_search, coordinates; parallel = true)
+    benchmark_count_neighbors(neighborhood_search, coordinates;
+                              parallelization_backend = default_backend(coordinates))
 
 A very cheap and simple neighborhood search benchmark, only counting the neighbors of each
 point. For each point-neighbor pair, only an array entry is incremented.
 
@@ -2,7 +2,8 @@ using PointNeighbors
 using BenchmarkTools
 
 """
-    benchmark_n_body(neighborhood_search, coordinates; parallel = true)
+    benchmark_n_body(neighborhood_search, coordinates;
+                     parallelization_backend = default_backend(coordinates))
 
 A simple neighborhood search benchmark, computing the right-hand side of an n-body
 simulation with a cutoff (corresponding to the search radius of `neighborhood_search`).
@@ -16,7 +17,6 @@ function benchmark_n_body(neighborhood_search, coordinates_;
                           parallelization_backend = default_backend(coordinates_))
     # Passing a different backend like `CUDA.CUDABackend`
     # allows us to change the type of the array to run the benchmark on the GPU.
-    # Passing `parallel = true` or `parallel = false` will not change anything here.
     coordinates = PointNeighbors.Adapt.adapt(parallelization_backend, coordinates_)
     nhs = PointNeighbors.Adapt.adapt(parallelization_backend, neighborhood_search)
 
 
@@ -0,0 +1,228 @@
+using Plots
+using BenchmarkTools
+
+# Generate a rectangular point cloud
+include("../test/point_cloud.jl")
+
+"""
+    run_benchmarks(benchmark, n_points_per_dimension, iterations, neighborhood_searches;
+                   parallelization_backend = PolyesterBackend(),
+                   names = ["NeighborhoodSearch 1" "NeighborhoodSearch 2" ...],
+                   seed = 1, perturbation_factor_position = 1.0)
+
+Run a benchmark with several neighborhood searches multiple times for increasing numbers
+of points and return the results as `(n_particles_vec, times)`, where `n_particles_vec`
+is a vector containing the number of particles for each iteration and `times` is a matrix
+containing the runtimes for each neighborhood search and iteration.
+
+See also
+- [`plot_benchmark`](@ref) to plot the results,
+- [`run_benchmark_default`](@ref) to run the benchmark with the most commonly used
+  neighborhood search implementations,
+- [`run_benchmark_gpu`](@ref) to run the benchmark with all GPU-compatible neighborhood
+  search implementations.
+
+# Arguments
+- `benchmark`:              The benchmark function. See [`benchmark_count_neighbors`](@ref),
+                            [`benchmark_n_body`](@ref), [`benchmark_wcsph`](@ref),
+                            [`benchmark_wcsph_fp32`](@ref) and [`benchmark_tlsph`](@ref).
+- `n_points_per_dimension`: Initial resolution as tuple. The product is the initial number
+                            of points. For example, use `(100, 100)` for a 2D benchmark or
+                            `(10, 10, 10)` for a 3D benchmark.
+- `iterations`:             Number of refinement iterations
+
+# Keywords
+- `parallelization_backend = PolyesterBackend()`: Parallelization strategy to use. See
+                                                  [`@threaded`](@ref) for a list of available
+                                                  backends.
+- `seed = 1`:               Seed to perturb the point positions. Different seeds yield
+                            slightly different point positions.
+- `perturbation_factor_position = 1.0`: Scale the point position perturbation by this factor.
+                                        A factor of `1.0` corresponds to a standard deviation
+                                        similar to that of a realistic simulation.
+
+# Examples
+```julia
+include("benchmarks/benchmarks.jl")
+
+run_benchmark(benchmark_count_neighbors, (10, 10), 3,
+              [TrivialNeighborhoodSearch{2}(), GridNeighborhoodSearch{2}()])
+```
+"""
+function run_benchmark(benchmark, n_points_per_dimension, iterations, neighborhood_searches;
+                       parallelization_backend = PolyesterBackend(),
+                       names = ["Neighborhood search $i"
+                                for i in 1:length(neighborhood_searches)]',
+                       seed = 1, perturbation_factor_position = 1.0)
+    # Multiply number of points in each iteration (roughly) by this factor
+    scaling_factor = 4
+    per_dimension_factor = scaling_factor^(1 / length(n_points_per_dimension))
+    sizes = [round.(Int, n_points_per_dimension .* per_dimension_factor^(iter - 1))
+             for iter in 1:iterations]
+
+    n_particles_vec = prod.(sizes)
+    times = zeros(iterations, length(neighborhood_searches))
+
+    for iter in 1:iterations
+        coordinates = point_cloud(sizes[iter]; seed, perturbation_factor_position)
+        domain_size = maximum(sizes[iter]) + 1
+
+        # Normalize domain size to 1
+        coordinates ./= domain_size
+
+        # Make this Float32 to make sure that Float32 benchmarks use Float32 exclusively
+        search_radius = 4.0f0 / domain_size
+        n_particles = size(coordinates, 2)
+
+        neighborhood_searches_copy = copy_neighborhood_search.(neighborhood_searches,
+                                                               search_radius, n_particles)
+
+        for i in eachindex(neighborhood_searches_copy)
+            neighborhood_search = neighborhood_searches_copy[i]
+            PointNeighbors.initialize!(neighborhood_search, coordinates, coordinates)
+
+            time = benchmark(neighborhood_search, coordinates; parallelization_backend)
+            times[iter, i] = time
+            time_string = BenchmarkTools.prettytime(time * 1e9)
+            time_string_per_particle = BenchmarkTools.prettytime(time * 1e9 / n_particles)
+            println("$(names[i])")
+            println("with $(join(sizes[iter], "x")) = $(prod(sizes[iter])) particles " *
+                    "finished in $time_string ($time_string_per_particle per particle)\n")
+        end
+    end
+
+    return n_particles_vec, times
+end
+
+"""
+    run_benchmark_default(benchmark, n_points_per_dimension, iterations; kwargs...)
+
+Shortcut to call [`run_benchmark`](@ref) with the most commonly used neighborhood search
+implementations:
+- `GridNeighborhoodSearch`
+- `GridNeighborhoodSearch` with `FullGridCellList`
+- `PrecomputedNeighborhoodSearch`
+
+# Arguments
+- `benchmark`:              The benchmark function. See [`benchmark_count_neighbors`](@ref),
+                            [`benchmark_n_body`](@ref), [`benchmark_wcsph`](@ref),
+                            [`benchmark_wcsph_fp32`](@ref) and [`benchmark_tlsph`](@ref).
+- `n_points_per_dimension`: Initial resolution as tuple. The product is the initial number
+                            of points. For example, use `(100, 100)` for a 2D benchmark or
+                            `(10, 10, 10)` for a 3D benchmark.
+- `iterations`:             Number of refinement iterations
+
+# Keywords
+See [`run_benchmark`](@ref) for a list of available keywords.
+
+# Examples
+```julia
+include("benchmarks/benchmarks.jl")
+
+run_benchmark_default(benchmark_n_body, (10, 10), 3)
+```
+"""
+function run_benchmark_default(benchmark, n_points_per_dimension, iterations; kwargs...)
+    NDIMS = length(n_points_per_dimension)
+    min_corner = 0.0f0 .* n_points_per_dimension
+    max_corner = Float32.(n_points_per_dimension ./ maximum(n_points_per_dimension))
+
+    neighborhood_searches = [
+        GridNeighborhoodSearch{NDIMS}(),
+        GridNeighborhoodSearch{NDIMS}(search_radius = 0.0f0,
+                                      cell_list = FullGridCellList(; search_radius = 0.0f0,
+                                                                   min_corner, max_corner)),
+        PrecomputedNeighborhoodSearch{NDIMS}()
+    ]
+
+    names = ["GridNeighborhoodSearch";;
+             "GridNeighborhoodSearch with FullGridCellList";;
+             "PrecomputedNeighborhoodSearch"]
+
+    run_benchmark(benchmark, n_points_per_dimension, iterations,
+                  neighborhood_searches; names, kwargs...)
+end
+
+"""
+    run_benchmark_gpu(benchmark, n_points_per_dimension, iterations; kwargs...)
+
+Shortcut to call [`run_benchmark`](@ref) with all GPU-compatible neighborhood search
+implementations:
+- `GridNeighborhoodSearch` with `FullGridCellList`
+
+# Arguments
+- `benchmark`:              The benchmark function. See [`benchmark_count_neighbors`](@ref),
+                            [`benchmark_n_body`](@ref), [`benchmark_wcsph`](@ref),
+                            [`benchmark_wcsph_fp32`](@ref) and [`benchmark_tlsph`](@ref).
+- `n_points_per_dimension`: Initial resolution as tuple. The product is the initial number
+                            of points. For example, use `(100, 100)` for a 2D benchmark or
+                            `(10, 10, 10)` for a 3D benchmark.
+- `iterations`:             Number of refinement iterations
+
+# Keywords
+See [`run_benchmark`](@ref) for a list of available keywords.
+
+# Examples
+```julia
+include("benchmarks/benchmarks.jl")
+
+run_benchmark_gpu(benchmark_n_body, (10, 10), 3)
+```
+"""
+function run_benchmark_gpu(benchmark, n_points_per_dimension, iterations; kwargs...)
+    NDIMS = length(n_points_per_dimension)
+
+    min_corner = 0.0f0 .* n_points_per_dimension
+    max_corner = Float32.(n_points_per_dimension ./ maximum(n_points_per_dimension))
+    neighborhood_searches = [
+        GridNeighborhoodSearch{NDIMS}(search_radius = 0.0f0,
+                                      cell_list = FullGridCellList(; search_radius = 0.0f0,
+                                                                   min_corner, max_corner))
+    ]
+
+    names = ["GridNeighborhoodSearch with FullGridCellList";;]
+
+    run_benchmark(benchmark, n_points_per_dimension, iterations,
+                  neighborhood_searches; names, kwargs...)
+end
+
+"""
+    plot_benchmark(n_particles_vec, times; kwargs...)
+
+Plot the results of a benchmark run with [`run_benchmark`](@ref).
+Note that the arguments are the outputs of that function.
+
+# Arguments
+- `n_particles_vec`: Vector containing the number of particles for each iteration.
+- `times`:           Matrix containing the runtimes for each neighborhood search and iteration.
+
+# Keywords
+Keyword arguments are passed to `Plots.plot`. For example, use `title = "My title"`.
+
+# Examples
+```julia
+include("benchmarks/benchmarks.jl")
+
+n_particles_vec, times = run_benchmark_default(benchmark_count_neighbors, (10, 10), 3)
+plot_benchmark(n_particles_vec, times; title = "Count neighbors benchmark")
+```
+"""
+function plot_benchmark(n_particles_vec, times; kwargs...)
+    function format_n_particles(n)
+        if n >= 1_000_000
+            return "$(round(Int, n / 1_000_000))M"
+        elseif n >= 1_000
+            return "$(round(Int, n / 1_000))k"
+        else
+            return string(n)
+        end
+    end
+    xticks = format_n_particles.(n_particles_vec)
+
+    plot(n_particles_vec, times ./ n_particles_vec .* 1e9;
+         xaxis = :log,
+         xticks = (n_particles_vec, xticks), linewidth = 2,
+         xlabel = "#particles", ylabel = "runtime per particle [ns]",
+         legend = :outerright, size = (700, 350), dpi = 200, margin = 4 * Plots.mm,
+         palette = palette(:tab10), kwargs...)
+end