Tweak plotting to collect outliers into a single bin; drop UnicodePlots dependency (#13)

ericphanson · brenhinkeller · web-flow · commit 1089a2528b5f · 2021-05-25T12:55:55.000+02:00
* Add `simpleunicodehistogram`


Co-authored-by: C. Brenhin Keller &lt;cbkeller@dartmouth.edu&gt;

* tweak `simpleunicodehistogram` for outliers

* rename things, add configuration, fix tests, update readme

* use Julia 1.0 compatible syntax

* fix omission of minimum

* bump version

Co-authored-by: C. Brenhin Keller &lt;cbkeller@dartmouth.edu&gt;
diff --git a/Project.toml b/Project.toml
@@ -1,17 +1,15 @@
 name = "BenchmarkHistograms"
 uuid = "a80a1652-aad8-438d-b80b-ecb1a674e33b"
 authors = ["Eric Hanson <5846501+ericphanson@users.noreply.github.com> and contributors"]
-version = "0.1.1"
+version = "0.2.0"
 
 [deps]
 BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
 Printf = "de0858da-6303-5e67-8744-51eddeeeb8d7"
 Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2"
-UnicodePlots = "b8865327-cd53-5732-bb35-84acbb429228"
 
 [compat]
 BenchmarkTools = "0.7, 1.0"
-UnicodePlots = "1.3"
 julia = "1"
 
 [extras]
diff --git a/README.md b/README.md
@@ -3,19 +3,19 @@
 
 # BenchmarkHistograms
 
-Wraps [BenchmarkTools.jl](https://github.com/JuliaCI/BenchmarkTools.jl/) to provide a UnicodePlots.jl-powered `show` method for `@benchmark`. This is accomplished by a custom `@benchmark` method which wraps the output in a `BenchmarkPlot` struct with a custom show method.
+Wraps [BenchmarkTools.jl](https://github.com/JuliaCI/BenchmarkTools.jl/) to provide a unicode histogram `show` method for `@benchmark`. This is accomplished by a custom `@benchmark` method which wraps the output in a `BenchmarkPlot` struct with a custom show method.
 
 This means one should not call `using` on both BenchmarkHistograms and BenchmarkTools in the same namespace, or else these `@benchmark` macros will conflict ("WARNING: using `BenchmarkTools.@benchmark` in module Main conflicts with an existing identifier.")
 
-However, BenchmarkHistograms re-exports all of BenchmarkTools (including the module `BenchmarkTools` itself), so you can simply call `using BenchmarkHistograms` instead.
+However, BenchmarkHistograms re-exports all the export of BenchmarkTools, so you can simply call `using BenchmarkHistograms`.
 
 Providing this functionality in BenchmarkTools itself was discussed in <https://github.com/JuliaCI/BenchmarkTools.jl/pull/180>.
+Thanks to @brenhinkeller for providing the initial plotting code there.
 
-Use the setting `BenchmarkHistograms.NBINS[]` to change the number of histogram bins used, e.g.
-```julia
-BenchmarkHistograms.NBINS[] = 10
-```
-to use 10 bins.
+Use the setting `BenchmarkHistograms.NBINS` to change the number of histogram bins used, e.g. `BenchmarkHistograms.NBINS[] = 10` for 10 bins.
+
+Likewise use the setting `BenchmarkHistograms.OUTLIER_QUANTILE` to tweak which values count as outliers and may be grouped into a single bin.
+For example, `BenchmarkHistograms.OUTLIER_QUANTILE[] = 0.99` counts any values past the 99 percentile as possible outliers. This value defaults to `0.999` and is disabled by setting it to `1.0`.
 
 ## Example
 
@@ -29,22 +29,27 @@ using BenchmarkHistograms
 
 ```
 samples: 10000; evals/sample: 1000; memory estimate: 0 bytes; allocs estimate: 0
-                   ┌                                        ┐ 
-      [ 4.0,  6.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 7823   
-      [ 6.0,  8.0) ┤▇▇▇▇▇▇▇ 1643                              
-      [ 8.0, 10.0) ┤▇▇ 529                                    
-      [10.0, 12.0) ┤ 2                                        
-      [12.0, 14.0) ┤ 2                                        
-   ns [14.0, 16.0) ┤ 0                                        
-      [16.0, 18.0) ┤ 0                                        
-      [18.0, 20.0) ┤ 0                                        
-      [20.0, 22.0) ┤ 0                                        
-      [22.0, 24.0) ┤ 0                                        
-      [24.0, 26.0) ┤ 0                                        
-      [26.0, 28.0) ┤ 1                                        
-                   └                                        ┘ 
-                                    Counts
-min: 4.916 ns (0.00% GC); mean: 5.724 ns (0.00% GC); median: 5.208 ns (0.00% GC); max: 27.458 ns (0.00% GC).
+ns
+
+ (8.04  - 8.53 ]  ██████████████████████████████▏7673
+ (8.53  - 9.02 ]  ▌109
+ (9.02  - 9.51 ]  ▏3
+ (9.51  - 10.01]   0
+ (10.01 - 10.5 ]   0
+ (10.5  - 10.99]  █████▋1431
+ (10.99 - 11.48]  ██▌624
+ (11.48 - 11.97]  ▍70
+ (11.97 - 12.46]  ▎38
+ (12.46 - 12.95]  ▏4
+ (12.95 - 13.44]  ▏1
+ (13.44 - 13.93]  ▏2
+ (13.93 - 14.42]  ▏7
+ (14.42 - 14.92]  ▏22
+ (14.92 - 21.88]  ▏16
+
+                  Counts
+
+min: 8.041 ns (0.00% GC); mean: 8.812 ns (0.00% GC); median: 8.166 ns (0.00% GC); max: 21.875 ns (0.00% GC).
 ```
 
 That benchmark does not have a very interesting distribution, but it's not hard to find more interesting cases.
@@ -54,18 +59,26 @@ That benchmark does not have a very interesting distribution, but it's not hard
 ```
 
 ```
-samples: 3192; evals/sample: 1000; memory estimate: 0 bytes; allocs estimate: 0
-                       ┌                                        ┐ 
-      [   0.0,  500.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 2036   
-      [ 500.0, 1000.0) ┤ 0                                        
-      [1000.0, 1500.0) ┤ 0                                        
-   ns [1500.0, 2000.0) ┤ 0                                        
-      [2000.0, 2500.0) ┤ 0                                        
-      [2500.0, 3000.0) ┤ 0                                        
-      [3000.0, 3500.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 1156                  
-                       └                                        ┘ 
-                                        Counts
-min: 1.875 ns (0.00% GC); mean: 1.141 μs (0.00% GC); median: 4.521 ns (0.00% GC); max: 3.315 μs (0.00% GC).
+samples: 3110; evals/sample: 1000; memory estimate: 0 bytes; allocs estimate: 0
+ns
+
+ (0.0    - 280.0 ]  ██████████████████████████████ 1964
+ (280.0  - 570.0 ]   0
+ (570.0  - 850.0 ]   0
+ (850.0  - 1130.0]   0
+ (1130.0 - 1410.0]   0
+ (1410.0 - 1690.0]   0
+ (1690.0 - 1970.0]   0
+ (1970.0 - 2250.0]   0
+ (2250.0 - 2540.0]   0
+ (2540.0 - 2820.0]   0
+ (2820.0 - 3100.0]   0
+ (3100.0 - 3380.0]  █████████████████1105
+ (3380.0 - 3660.0]  ▊41
+
+                  Counts
+
+min: 2.500 ns (0.00% GC); mean: 1.181 μs (0.00% GC); median: 5.334 ns (0.00% GC); max: 3.663 μs (0.00% GC).
 ```
 
 Here, we see a bimodal distribution; in the case `5` is indeed in the vector, we find it very quickly, in the 0-1000 ns range (thanks to `sort` which places it at the front). In the case 5 is not present, we need to check every entry to be sure, and we end up in the 3000-4000 ns range.
@@ -77,18 +90,26 @@ Without the `sort`, we end up with more of a uniform distribution:
 ```
 
 ```
-samples: 2461; evals/sample: 999; memory estimate: 0 bytes; allocs estimate: 0
-                       ┌                                        ┐ 
-      [   0.0,  500.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 364                        
-      [ 500.0, 1000.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇ 327                          
-      [1000.0, 1500.0) ┤▇▇▇▇▇▇▇▇▇▇ 266                            
-   ns [1500.0, 2000.0) ┤▇▇▇▇▇▇▇▇ 214                              
-      [2000.0, 2500.0) ┤▇▇▇▇▇▇▇▇ 213                              
-      [2500.0, 3000.0) ┤▇▇▇▇▇ 146                                 
-      [3000.0, 3500.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 931   
-                       └                                        ┘ 
-                                        Counts
-min: 8.842 ns (0.00% GC); mean: 1.972 μs (0.00% GC); median: 2.154 μs (0.00% GC); max: 3.364 μs (0.00% GC).
+samples: 2393; evals/sample: 1000; memory estimate: 0 bytes; allocs estimate: 0
+ns
+
+ (0.0    - 310.0 ]  ███████▏214
+ (310.0  - 610.0 ]  ██████▍191
+ (610.0  - 910.0 ]  █████▊173
+ (910.0  - 1220.0]  █████▊174
+ (1220.0 - 1520.0]  █████▏155
+ (1520.0 - 1830.0]  ████▍133
+ (1830.0 - 2130.0]  ████119
+ (2130.0 - 2430.0]  ███▍100
+ (2430.0 - 2740.0]  ██▉86
+ (2740.0 - 3040.0]  ███▍102
+ (3040.0 - 3350.0]  ██████████████████████████████ 912
+ (3350.0 - 3650.0]  █30
+ (3650.0 - 5870.0]  ▎4
+
+                  Counts
+
+min: 2.334 ns (0.00% GC); mean: 2.037 μs (0.00% GC); median: 2.236 μs (0.00% GC); max: 5.869 μs (0.00% GC).
 ```
 
 This function gives a somewhat more Gaussian distribution of times, kindly supplied by Mason Protter:
@@ -100,28 +121,33 @@ f() = sum((sin(i) for i in 1:round(Int, 1000 + 100*randn())))
 ```
 
 ```
-samples: 10000; evals/sample: 1; memory estimate: 0 bytes; allocs estimate: 0
-                         ┌                                        ┐ 
-      [ 8000.0,  9000.0) ┤ 12                                       
-      [ 9000.0, 10000.0) ┤▇ 117                                     
-      [10000.0, 11000.0) ┤▇▇▇▇▇▇▇ 635                               
-      [11000.0, 12000.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 1810                
-      [12000.0, 13000.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 2959   
-      [13000.0, 14000.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 2460         
-   ns [14000.0, 15000.0) ┤▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇ 1451                    
-      [15000.0, 16000.0) ┤▇▇▇▇▇ 456                                 
-      [16000.0, 17000.0) ┤▇ 89                                      
-      [17000.0, 18000.0) ┤ 9                                        
-      [18000.0, 19000.0) ┤ 1                                        
-      [19000.0, 20000.0) ┤ 0                                        
-      [20000.0, 21000.0) ┤ 1                                        
-                         └                                        ┘ 
-                                          Counts
-min: 8.109 μs (0.00% GC); mean: 12.865 μs (0.00% GC); median: 12.820 μs (0.00% GC); max: 20.459 μs (0.00% GC).
+samples: 10000; evals/sample: 3; memory estimate: 0 bytes; allocs estimate: 0
+ns
+
+ (7030.0  - 7480.0 ]  ▏11
+ (7480.0  - 7930.0 ]  █▍128
+ (7930.0  - 8380.0 ]  ████████▏788
+ (8380.0  - 8830.0 ]  █████████████████████▏2044
+ (8830.0  - 9280.0 ]  ██████████████████████████████ 2916
+ (9280.0  - 9730.0 ]  ███████████████████████▉2309
+ (9730.0  - 10180.0]  ████████████▎1182
+ (10180.0 - 10630.0]  ████▎413
+ (10630.0 - 11080.0]  █▌140
+ (11080.0 - 11530.0]  ▌44
+ (11530.0 - 11980.0]  ▏6
+ (11980.0 - 12430.0]  ▏3
+ (12430.0 - 12880.0]   0
+ (12880.0 - 13330.0]  ▏5
+ (13330.0 - 18330.0]  ▏11
+
+                  Counts
+
+min: 7.028 μs (0.00% GC); mean: 9.184 μs (0.00% GC); median: 9.153 μs (0.00% GC); max: 18.333 μs (0.00% GC).
 ```
 
 See also <https://tratt.net/laurie/blog/entries/minimum_times_tend_to_mislead_when_benchmarking.html> for another example of where looking at the whole histogram can be useful in benchmarking.
 
 ---
 
 *This page was generated using [Literate.jl](https://github.com/fredrikekre/Literate.jl).*
+
diff --git a/generate_readme/README.jl b/generate_readme/README.jl
@@ -3,15 +3,19 @@
 
 # # BenchmarkHistograms
 
-# Wraps [BenchmarkTools.jl](https://github.com/JuliaCI/BenchmarkTools.jl/) to provide a UnicodePlots.jl-powered `show` method for `@benchmark`. This is accomplished by a custom `@benchmark` method which wraps the output in a `BenchmarkPlot` struct with a custom show method.
+# Wraps [BenchmarkTools.jl](https://github.com/JuliaCI/BenchmarkTools.jl/) to provide a unicode histogram `show` method for `@benchmark`. This is accomplished by a custom `@benchmark` method which wraps the output in a `BenchmarkPlot` struct with a custom show method.
 
 # This means one should not call `using` on both BenchmarkHistograms and BenchmarkTools in the same namespace, or else these `@benchmark` macros will conflict ("WARNING: using `BenchmarkTools.@benchmark` in module Main conflicts with an existing identifier.")
 
 # However, BenchmarkHistograms re-exports all the export of BenchmarkTools, so you can simply call `using BenchmarkHistograms`.
 
 # Providing this functionality in BenchmarkTools itself was discussed in <https://github.com/JuliaCI/BenchmarkTools.jl/pull/180>.
+# Thanks to @brenhinkeller for providing the initial plotting code there.
 
-# Use the setting `BenchmarkHistograms.NBINS[] = 10` to change the number of histogram bins used.
+# Use the setting `BenchmarkHistograms.NBINS` to change the number of histogram bins used, e.g. `BenchmarkHistograms.NBINS[] = 10` for 10 bins.
+
+# Likewise use the setting `BenchmarkHistograms.OUTLIER_QUANTILE` to tweak which values count as outliers and may be grouped into a single bin.
+# For example, `BenchmarkHistograms.OUTLIER_QUANTILE[] = 0.99` counts any values past the 99 percentile as possible outliers. This value defaults to `0.999` and is disabled by setting it to `1.0`.
 
 # ## Example
 
diff --git a/src/BenchmarkHistograms.jl b/src/BenchmarkHistograms.jl
@@ -1,6 +1,5 @@
 module BenchmarkHistograms
 
-using UnicodePlots
 using Statistics
 using Printf
 using BenchmarkTools: BenchmarkTools
@@ -20,10 +19,18 @@ export @benchmark
     const NBINS = Ref(0)
 
 Controls the number of histogram bins used.
-When `NBINS[] <= 0`, the number is chosen automatically by UnicodePlots.
+When `NBINS[] <= 0`, the number is chosen automatically by Sturge's rule (i.e. `log2(length(data))+1`).
 """
 const NBINS = Ref(0)
 
+"""
+    OUTLIER_QUANTILE = Ref(0.999)
+
+Controls which benchmarking times count as outliers and may be grouped into a single bin.
+Set `OUTLIER_QUANTILE[] = 1.0` to avoid this behavior.
+"""
+const OUTLIER_QUANTILE = Ref(0.999)
+
 struct BenchmarkHistogram
     trial::BenchmarkTools.Trial
 end
@@ -53,7 +60,8 @@ function Base.show(io::IO, ::MIME"text/plain", bp::BenchmarkHistogram; nbins=NBI
     println(io, "samples: ", length(t), "; evals/sample: ", t.params.evals, "; memory estimate: ", memorystr, "; allocs estimate: ", allocsstr)
     if length(t) > 0
         bin_arg = nbins <= 0 ? NamedTuple() : (; nbins=nbins)
-        show(io, histogram(t.times; ylabel="ns", xlabel="Counts", bin_arg...))
+        simple_unicode_histogram(io, t.times; ylabel="ns", xlabel="Counts",
+        outlier_quantile=OUTLIER_QUANTILE[], bin_arg...)
         println(io)
     end
     print(io, "min: ", minstr, "; mean: ", meanstr, "; median: ", medstr, "; max: ", maxstr, ".")
@@ -70,4 +78,7 @@ end
 # so that we don't have to rely on internals.
 include("vendor.jl")
 
+# The code to draw the histograms
+include("simple_unicode_histogram.jl")
+
 end
diff --git a/src/simple_unicode_histogram.jl b/src/simple_unicode_histogram.jl
@@ -0,0 +1,68 @@
+# Modified from https://github.com/JuliaCI/BenchmarkTools.jl/pull/180#issuecomment-711128281 by @brenhinkeller
+
+const BLOCKS = [" ","▏","▎","▍","▌","▋","▊","▉","█","█"]
+
+function simple_unicode_histogram(io::IO, x::AbstractArray;
+                                  nbins::Integer=ceil(Int, log2(length(x))+1),
+                                  plot_width::Integer=30, show_counts::Bool=true,
+                                  outlier_quantile = 0.999,
+                                  xlabel="", ylabel="")
+    # Find bounds. Our naive attempt is to use equal width
+    # bins from the minimum to the maximum.
+    l, M = extrema(x)
+    # our lower bounds are exclusive, so we want to be sure to get the min
+    l = prevfloat(l)
+
+    # Now, we check: if we don't have some big outliers, we'd expect
+    # the 99.9 percentile, `Q`, to be within a few bins of the maximum.
+    # Here, we choose 2. If it is not, then we decide that indeed
+    # there are outliers. We will instead divide the range from
+    # the minimum to `Q` equally with `nbins-1` bins, and then reserve
+    # the last bin to hold everything greater than `Q`.
+    Q = quantile(x, outlier_quantile)
+    initial_dx = (M - l) / nbins
+    truncate = M - Q > 2*initial_dx
+
+    # our "upper bound"
+    u = truncate ? Q : M
+
+    # Fill histogram
+    hist_counts = fill(0, nbins)
+    dx = truncate ? (u - l) / (nbins - 1) : initial_dx
+    for xi in x
+        index = ceil(Int, (xi - l) / dx)
+        if 1 <= index <= nbins
+            hist_counts[index] += 1
+        else
+            hist_counts[end] += 1
+        end
+    end
+
+    if truncate
+        bin_edges = [range(l;stop=u,length=nbins); M]
+    else
+        bin_edges = range(l;stop=u,length=nbins+1)
+    end
+
+    # Print the histogram
+    d = ceil(Int, -log10(u-l))+1
+    scale = plot_width/maximum(hist_counts)
+    lower_labels = string.(round.(bin_edges[1:end-1], digits=d+ceil(Int,log10(nbins)-1)))
+    upper_labels = string.(round.(bin_edges[2:end], digits=d+ceil(Int,log10(nbins)-1)))
+    longest_lower = maximum(length.(lower_labels))
+    longest_upper = maximum(length.(upper_labels))
+    !isempty(ylabel) && println(io, ylabel, "\n")
+    for i=1:nbins
+        nblocks = hist_counts[i] * scale
+        block_string = repeat("█", floor(Int, nblocks)) * BLOCKS[ceil(Int,(nblocks - floor(nblocks))*8)+1]
+        print(io, " (", lower_labels[i], " "^(longest_lower - length(lower_labels[i])))
+        print(io, " - ", upper_labels[i], " "^(longest_upper - length(upper_labels[i])), "]  ")
+        printstyled(io, block_string; color=:green)
+        if show_counts
+            print(io, hist_counts[i])
+        end
+        println(io)
+    end
+    isempty(xlabel) || println(io, "\n", " "^max(plot_width ÷2 + 6 - length(xlabel)÷2, 0), xlabel)
+    return nothing
+end
diff --git a/test/runtests.jl b/test/runtests.jl