Refactor to make it easier to test fixed-length

jaja360 · jaja360 · commit c7cce34612db · 2025-05-13T13:47:07.000-04:00
diff --git a/README.md b/README.md
@@ -102,6 +102,9 @@ algorithms that output fixed-length representation of a given length:
 ./build/benchmarks/benchmark -f data/canada.txt -F [length]
 ```
 
+Note that fixed-length mode only works when comparing speeds, not when measuring
+properties of the algorithms, i.e., `-F/--fixed` and `-t/--test` cannot be combined.
+
 ## Other existing benchmarks
 
 - [dtoa Benchmark](https://github.com/miloyip/dtoa-benchmark)
diff --git a/benchmarks/algorithms.h b/benchmarks/algorithms.h
@@ -44,44 +44,24 @@
 #define YY_DOUBLE_SUPPORTED 0
 #endif
 
-namespace Benchmarks {
-
-enum Algorithm {
-  DRAGON4 = 0,
-  ERROL3 = 1,
-  TO_STRING = 2,
-  FMT_FORMAT = 3,
-  NETLIB = 4,
-  SNPRINTF = 5,
-  GRISU2 = 6,
-  GRISU_EXACT = 7,
-  SCHUBFACH = 8,
-  DRAGONBOX = 9,
-  RYU = 10,
-  TEJU_JAGUA = 11,
-  DOUBLE_CONVERSION = 12,
-  ABSEIL = 13,
-  STD_TO_CHARS = 14,
-  GRISU3 = 15,
-  SWIFT_DTOA = 16,
-  YY_DOUBLE = 17,
-  COUNT // Keep last
-};
-
 template<arithmetic_float T>
 struct BenchArgs {
   using Type = T;
+  using BenchFn = std::function<int(T, std::span<char>&, size_t fixed_size)>;
 
-  BenchArgs(const std::string& name = {}, int (*func)(T, std::span<char>&) = {},
-            bool used = true, size_t testRepeat = 100)
-      : name(name), func(func), used(used), testRepeat(testRepeat) {}
+  BenchArgs(const std::string& name = {}, BenchFn func = {}, bool used = true,
+            size_t testRepeat = 100, size_t fixedSize = 9)
+      : name(name), func(func), used(used), testRepeat(testRepeat), fixedSize(fixedSize) {}
 
   std::string name{};
-  int (*func)(T, std::span<char>&){};
+  BenchFn func{};
   bool used{};
   size_t testRepeat{100};
+  size_t fixedSize{9};
 };
 
+namespace BenchmarkShortest {
+
 template<arithmetic_float T>
 int dragon4(T d, std::span<char>& buffer) {
   if constexpr (std::is_same_v<T, float>)
@@ -187,14 +167,6 @@ int netlib(T d, std::span<char>& buffer) {
 #endif
 }
 
-template<arithmetic_float T>
-int snprintf(T d, std::span<char>& buffer) {
-  if constexpr (std::is_same_v<T, float>)
-    return std::snprintf(buffer.data(), buffer.size(), "%.9g", d);
-  else
-    return std::snprintf(buffer.data(), buffer.size(), "%.17g", d);
-}
-
 // grisu2 is hardcoded for double.
 template<arithmetic_float T>
 int grisu2(T d, std::span<char>& buffer) {
@@ -284,19 +256,6 @@ int yy_double(T d, std::span<char>& buffer) {
 #endif
 }
 
-template<arithmetic_float T>
-int abseil(T d, std::span<char>& buffer) {
-  // StrAppend is faster but only outputs 6 digits after the decimal point
-  // std::string s;
-  // absl::StrAppend(&s, d);
-  // std::copy(s.begin(), s.end(), buffer.begin());
-  // return size(s);
-  if constexpr (std::is_same_v<T, float>)
-    return absl::SNPrintF(buffer.data(), buffer.size(), "%.9g", d);
-  else
-    return absl::SNPrintF(buffer.data(), buffer.size(), "%.17g", d);
-}
-
 template<arithmetic_float T>
 int std_to_chars(T d, std::span<char>& buffer) {
 #if TO_CHARS_SUPPORTED
@@ -313,34 +272,91 @@ int std_to_chars(T d, std::span<char>& buffer) {
 #endif
 }
 
+}  // namespace BenchmarkShortest
+
+namespace BenchmarkFixedSize {
+
+template<arithmetic_float T>
+int abseil(T d, std::span<char>& buffer, size_t fixed_size) {
+  // StrAppend is faster but only outputs 6 digits after the decimal point
+  // std::string s;
+  // absl::StrAppend(&s, d);
+  // std::copy(s.begin(), s.end(), buffer.begin());
+  // return size(s);
+  if constexpr (std::is_same_v<T, float>)
+    return absl::SNPrintF(buffer.data(), buffer.size(), "%.9g", d);
+  else
+    return absl::SNPrintF(buffer.data(), buffer.size(), "%.17g", d);
+}
+
+template<arithmetic_float T>
+int snprintf(T d, std::span<char>& buffer, size_t fixed_size) {
+  if constexpr (std::is_same_v<T, float>)
+    return std::snprintf(buffer.data(), buffer.size(), "%.9g", d);
+  else
+    return std::snprintf(buffer.data(), buffer.size(), "%.17g", d);
+}
+
+}  // namespace BenchmarkFixedSize
+
+template <typename T>
+auto make_shortest_adapter(int (*fn)(T, std::span<char>&)) {
+  return [fn](T v, std::span<char>& buf, size_t /*fixed_size*/) -> int {
+    return fn(v, buf);
+  };
+}
+
+template <typename T>
+auto make_fixed_adapter(int (*fn)(T, std::span<char>&, size_t)) {
+  return [fn](T v, std::span<char>& buf, size_t fixed_size) -> int {
+    return fn(v, buf, fixed_size);
+  };
+}
+
 template <arithmetic_float T>
-std::array<BenchArgs<T>, Benchmarks::COUNT> initArgs(size_t fixed_size, bool use_errol = false) {
-  if (fixed_size == 0) {  // shortest length representation
-    std::array<BenchArgs<T>, Benchmarks::COUNT> args;
-    args[Benchmarks::DRAGON4]           = { "dragon4"           , Benchmarks::dragon4<T>           , true                          , 10 };
-    args[Benchmarks::ERROL3]            = { "errol3"            , Benchmarks::errol3<T>            , ERROL_SUPPORTED && use_errol };
-    args[Benchmarks::TO_STRING]         = { "std::to_string"    , Benchmarks::to_string<T>         , true };
-    args[Benchmarks::FMT_FORMAT]        = { "fmt::format"       , Benchmarks::fmt_format<T>        , true };
-    args[Benchmarks::NETLIB]            = { "netlib"            , Benchmarks::netlib<T>            , NETLIB_SUPPORTED  && std::is_same_v<T, double>, 10 };
-    args[Benchmarks::SNPRINTF]          = { "snprintf"          , Benchmarks::snprintf<T>          , true };
-    args[Benchmarks::GRISU2]            = { "grisu2"            , Benchmarks::grisu2<T>            , std::is_same_v<T, double> };
-    args[Benchmarks::GRISU_EXACT]       = { "grisu_exact"       , Benchmarks::grisu_exact<T>       , true };
-    args[Benchmarks::SCHUBFACH]         = { "schubfach"         , Benchmarks::schubfach<T>         , true };
-    args[Benchmarks::DRAGONBOX]         = { "dragonbox"         , Benchmarks::dragonbox<T>         , true };
-    args[Benchmarks::RYU]               = { "ryu"               , Benchmarks::ryu<T>               , true };
-    args[Benchmarks::TEJU_JAGUA]        = { "teju_jagua"        , Benchmarks::teju_jagua<T>        , true };
-    args[Benchmarks::DOUBLE_CONVERSION] = { "double_conversion" , Benchmarks::double_conversion<T> , true };
-    args[Benchmarks::ABSEIL]            = { "abseil"            , Benchmarks::abseil<T>            , ABSEIL_SUPPORTED };
-    args[Benchmarks::STD_TO_CHARS]      = { "std::to_chars"     , Benchmarks::std_to_chars<T>      , TO_CHARS_SUPPORTED };
-    args[Benchmarks::GRISU3]            = { "grisu3"            , Benchmarks::grisu3<T>            , std::is_same_v<T, double> };
-    args[Benchmarks::SWIFT_DTOA]        = { "SwiftDtoa"         , Benchmarks::swiftDtoa<T>         , SWIFT_LIB_SUPPORTED };
-    args[Benchmarks::YY_DOUBLE]         = { "yy_double"         , Benchmarks::yy_double<T>         , YY_DOUBLE_SUPPORTED && std::is_same_v<T, double> };
-    return args;
+std::vector<BenchArgs<T>> initArgs(bool use_errol = false, size_t repeat = 0, size_t fixed_size = 0) {
+  std::vector<BenchArgs<T>> args;
+  if (fixed_size == 0) {  // shortest-length representation
+    auto&& wrap = make_shortest_adapter<T>;
+    namespace s = BenchmarkShortest;
+    args.emplace_back("dragon4"           , wrap(s::dragon4<T>)           , true                                           , 10);
+    args.emplace_back("netlib"            , wrap(s::netlib<T>)            , NETLIB_SUPPORTED && std::is_same_v<T, double>  , 10);
+    args.emplace_back("errol3"            , wrap(s::errol3<T>)            , ERROL_SUPPORTED && use_errol);
+    args.emplace_back("fmt_format"        , wrap(s::fmt_format<T>)        , true);
+    args.emplace_back("grisu2"            , wrap(s::grisu2<T>)            , std::is_same_v<T, double>);
+    args.emplace_back("grisu3"            , wrap(s::grisu3<T>)            , std::is_same_v<T, double>);
+    args.emplace_back("grisu_exact"       , wrap(s::grisu_exact<T>)       , true);
+    args.emplace_back("schubfach"         , wrap(s::schubfach<T>)         , true);
+    args.emplace_back("dragonbox"         , wrap(s::dragonbox<T>)         , true);
+    args.emplace_back("ryu"               , wrap(s::ryu<T>)               , true);
+    args.emplace_back("teju_jagua"        , wrap(s::teju_jagua<T>)        , true);
+    args.emplace_back("double_conversion" , wrap(s::double_conversion<T>) , true);
+    args.emplace_back("swiftDtoa"         , wrap(s::swiftDtoa<T>)         , SWIFT_LIB_SUPPORTED);
+    args.emplace_back("yy_double"         , wrap(s::yy_double<T>)         , YY_DOUBLE_SUPPORTED && std::is_same_v<T, double>);
+    args.emplace_back("std::to_chars"     , wrap(s::std_to_chars<T>)      , TO_CHARS_SUPPORTED);
+
+    // to_string, snprintf and abseil do not support shortest-length representation
   } else {  // fixed-length representation
-    throw std::runtime_error("fixed length representation not yet implemented");
+    auto&& wrap = make_fixed_adapter<T>;
+    namespace f = BenchmarkFixedSize;
+    args.emplace_back("snprintf" , wrap(f::snprintf<T>) , true);
+    args.emplace_back("abseil"   , wrap(f::abseil<T>)   , ABSEIL_SUPPORTED);
+
+    // to_string is hard-coded for 6 digits after the decimal point
+    // args.emplace_back("to_string", BenchmarkFixedSize::to_string<T>, true);
+
+    fmt::println("# testing fixed-size output to {} digits", fixed_size);
+    for (auto &arg : args)
+      arg.fixedSize = fixed_size;
   }
-};
 
-}  // namespace Benchmarks
+  if (repeat > 0) {
+      fmt::println("# forcing repeat count to {}", repeat);
+      for (auto &arg : args)
+          arg.testRepeat = repeat;
+  }
+
+  return args;
+};
 
 #endif
diff --git a/benchmarks/benchmark.cpp b/benchmarks/benchmark.cpp
@@ -25,11 +25,9 @@
 #include <fast_float/fast_float.h>
 #include <fmt/core.h>
 
-using Benchmarks::BenchArgs;
-
 template <arithmetic_float T>
 void evaluateProperties(const std::vector<TestCase<T>> &lines,
-                        const std::array<BenchArgs<T>, Benchmarks::COUNT> &args,
+                        const std::vector<BenchArgs<T>> &args,
                         const std::vector<std::string> &algo_filter) {
   evaluate_properties_helper<T>(lines, algo_filter, args);
 }
@@ -44,7 +42,7 @@ struct diy_float_t {
 
 template <arithmetic_float T>
 void process(const std::vector<TestCase<T>> &lines,
-             const std::array<BenchArgs<T>, Benchmarks::COUNT> &args,
+             const std::vector<BenchArgs<T>> &args,
              const std::vector<std::string> &algo_filter) {
   // We have a special algorithm for the string generation:
   if (!algo_filtered_out("just_string", algo_filter)) {
@@ -95,7 +93,7 @@ void process(const std::vector<TestCase<T>> &lines,
       char buf[100];
       std::span<char> bufspan(buf, sizeof(buf));
       for (const auto d : lines)
-        volume += algo.func(d.value, bufspan);
+        volume += algo.func(d.value, bufspan, algo.fixedSize);
       return volume;
     }, algo.testRepeat);
   }
@@ -170,7 +168,6 @@ int main(int argc, char **argv) {
       fmt::print("{}\n", options.help());
       return EXIT_SUCCESS;
     }
-    const size_t repeat = result["repeat"].as<size_t>();
     const bool single = result["single"].as<bool>();
     const auto filter = result.count("algo-filter")
                       ? result["algo-filter"].as<std::vector<std::string>>()
@@ -197,22 +194,14 @@ int main(int argc, char **argv) {
         numbers = fileload<double>(filename);
     }
 
-    std::variant<std::array<BenchArgs<float>, Benchmarks::COUNT>,
-                 std::array<BenchArgs<double>, Benchmarks::COUNT>> algorithms;
+    std::variant<std::vector<BenchArgs<float>>, std::vector<BenchArgs<double>>> algorithms;
     const bool errol = result["errol"].as<bool>();
+    const size_t repeat = result["repeat"].as<size_t>();
     const size_t fixed_size = result["fixed"].as<size_t>();
     if (single)
-      algorithms = Benchmarks::initArgs<float>(fixed_size, errol);
+      algorithms = initArgs<float>(errol, repeat, fixed_size);
     else
-      algorithms = Benchmarks::initArgs<double>(fixed_size, errol);
-
-    if(repeat > 0) {
-      fmt::println("# forcing repeat count to {}", repeat);
-      std::visit([repeat](auto &args) {
-        for (auto &arg : args)
-          arg.testRepeat = repeat;
-      }, algorithms);
-    }
+      algorithms = initArgs<double>(errol, repeat, fixed_size);
 
     const bool test = result["test"].as<bool>();
     std::visit([test, &filter](const auto &lines, const auto &args) {
diff --git a/benchmarks/benchutil.h b/benchmarks/benchutil.h
@@ -13,8 +13,6 @@
 #include "algorithms.h"
 #include "counters/event_counter.h"
 
-using Benchmarks::BenchArgs;
-
 event_collector collector;
 
 bool algo_filtered_out(const std::string &algo_name,
@@ -50,11 +48,11 @@ concept TestCaseRange
 template<arithmetic_float T, typename Range> requires TestCaseRange<Range, T>
 void evaluate_properties_helper(Range&& cases,
                                 const std::vector<std::string> &algo_filter,
-                                std::variant<std::array<BenchArgs<T>, Benchmarks::COUNT>, bool> argsOpt) {
+                                std::variant<std::vector<BenchArgs<T>>, bool> argsOpt) {
   fmt::println("{:20} {:20}", "Algorithm", "Valid shortest serialization");
   const auto args = std::holds_alternative<bool>(argsOpt)
-                  ? Benchmarks::initArgs<T>(std::get<bool>(argsOpt))
-                  : std::get<std::array<BenchArgs<T>, Benchmarks::COUNT>>(argsOpt);
+                  ? initArgs<T>(std::get<bool>(argsOpt))
+                  : std::get<std::vector<BenchArgs<T>>>(argsOpt);
 
   // Get number of cases for progress display
   uint64_t total = 0;
@@ -69,7 +67,7 @@ void evaluate_properties_helper(Range&& cases,
       fmt::println("# skipping {}", algo.name);
       continue;
     }
-    if (algo.func == Benchmarks::dragonbox<T>) {
+    if (algo.name == "dragonbox") {
       fmt::println("# skipping {} because it is the reference.", algo.name);
       continue;
     }
@@ -102,8 +100,8 @@ void evaluate_properties_helper(Range&& cases,
       // the shortest representation, which is not necessarily the same as the
       // representation using the fewest significant digits.
       // So we use dragonbox, which serves as the reference implementation.
-      const size_t vRef  = Benchmarks::dragonbox(d, bufRef);
-      const size_t vAlgo = algo.func(d, bufAlgo);
+      const size_t vRef  = BenchmarkShortest::dragonbox(d, bufRef);
+      const size_t vAlgo = algo.func(d, bufAlgo, algo.fixedSize);
 
       std::string_view svRef{bufRef.data(), vRef},
                        svAlgo{bufAlgo.data(), vAlgo};
diff --git a/benchmarks/exhaustivefloat32.cpp b/benchmarks/exhaustivefloat32.cpp
@@ -8,8 +8,6 @@
 #include "floatutils.h"
 #include "benchutil.h"
 
-using Benchmarks::BenchArgs;
-
 void run_exhaustive32(bool errol, const std::vector<std::string>& algo_filter = {}) {
   static_assert(sizeof(float) == sizeof(uint32_t));
   auto floats_view