Add and base-10 specialization

mborland · mborland · commit c98f81a47047 · 2025-07-23T13:52:54.000-04:00
diff --git a/include/boost/decimal/charconv.hpp b/include/boost/decimal/charconv.hpp
@@ -324,7 +324,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_scientific_impl(char* first, char* last, c
     }
 
     // Offset the value of first by 1 so that we can copy the leading digit and insert a decimal point
-    auto r = to_chars_integer_impl<uint_type, uint_type>(first + 1, last, significand, 10);
+    auto r = to_chars_integer_impl<uint_type>(first + 1, last, significand);
 
     // Only real reason we will hit this is a buffer overflow
     if (BOOST_DECIMAL_UNLIKELY(!r))
@@ -398,7 +398,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_scientific_impl(char* first, char* last, c
         *first++ = '0';
     }
 
-    r = to_chars_integer_impl<int, unsigned>(first, last, abs_exp, 10);
+    r = to_chars_integer_impl<int>(first, last, abs_exp);
     if (BOOST_DECIMAL_UNLIKELY(!r))
     {
         return r; // LCOV_EXCL_LINE
@@ -544,7 +544,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_fixed_impl(char* first, char* last, const
                                           std::numeric_limits<std::uint64_t>::digits),
                                           int128::uint128_t, std::uint64_t>;
 
-    auto r = to_chars_integer_impl<uint_type, uint_type>(first, last, significand, 10);
+    auto r = to_chars_integer_impl<uint_type>(first, last, significand);
 
     if (BOOST_DECIMAL_UNLIKELY(!r))
     {
@@ -775,7 +775,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_hex_impl(char* first, char* last, const Ta
         *first++ = '0';
     }
 
-    return to_chars_integer_impl<std::uint32_t, std::uint32_t>(first, last, static_cast<std::uint32_t>(abs_exp), 10);
+    return to_chars_integer_impl<std::uint32_t>(first, last, static_cast<std::uint32_t>(abs_exp));
 }
 
 #ifdef _MSC_VER
diff --git a/include/boost/decimal/detail/to_chars_integer_impl.hpp b/include/boost/decimal/detail/to_chars_integer_impl.hpp
@@ -105,6 +105,268 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_integer_impl(char* first, char* last, Inte
     return {first + num_chars, std::errc()};
 }
 
+// Specialization for base-10
+// radix_table stores the two-character decimal text of 00..99 back to back, so the pair for k starts at index 2 * k
+BOOST_DECIMAL_CONSTEXPR_VARIABLE char radix_table[] = {
+    '0', '0', '0', '1', '0', '2', '0', '3', '0', '4',
+    '0', '5', '0', '6', '0', '7', '0', '8', '0', '9',
+    '1', '0', '1', '1', '1', '2', '1', '3', '1', '4',
+    '1', '5', '1', '6', '1', '7', '1', '8', '1', '9',
+    '2', '0', '2', '1', '2', '2', '2', '3', '2', '4',
+    '2', '5', '2', '6', '2', '7', '2', '8', '2', '9',
+    '3', '0', '3', '1', '3', '2', '3', '3', '3', '4',
+    '3', '5', '3', '6', '3', '7', '3', '8', '3', '9',
+    '4', '0', '4', '1', '4', '2', '4', '3', '4', '4',
+    '4', '5', '4', '6', '4', '7', '4', '8', '4', '9',
+    '5', '0', '5', '1', '5', '2', '5', '3', '5', '4',
+    '5', '5', '5', '6', '5', '7', '5', '8', '5', '9',
+    '6', '0', '6', '1', '6', '2', '6', '3', '6', '4',
+    '6', '5', '6', '6', '6', '7', '6', '8', '6', '9',
+    '7', '0', '7', '1', '7', '2', '7', '3', '7', '4',
+    '7', '5', '7', '6', '7', '7', '7', '8', '7', '9',
+    '8', '0', '8', '1', '8', '2', '8', '3', '8', '4',
+    '8', '5', '8', '6', '8', '7', '8', '8', '8', '9',
+    '9', '0', '9', '1', '9', '2', '9', '3', '9', '4',
+    '9', '5', '9', '6', '9', '7', '9', '8', '9', '9'
+};
+// Writes value as exactly 10 decimal characters (zero-padded on the left) into buffer[0..9] and returns buffer + 10
+// See: https://jk-jeon.github.io/posts/2022/02/jeaiii-algorithm/
+// https://arxiv.org/abs/2101.11408
+constexpr char* decompose32(std::uint32_t value, char* buffer) noexcept
+{
+    constexpr auto mask = (UINT64_C(1) << 57) - 1; // keeps the low 57 bits, i.e. everything below the current digit pair
+    auto y = value * UINT64_C(1441151881); // 1441151881 == ceil(2^57 / 10^8): y >> 57 is then the leading two digits of value
+
+    for (std::size_t i {}; i < 10; i += 2)
+    {
+        boost::decimal::detail::memcpy(buffer + i, radix_table + static_cast<std::size_t>(y >> 57) * 2, 2);
+        y &= mask; // discard the two digits that were just emitted
+        y *= 100U; // move the next two digits up above bit 57
+    }
+
+    return buffer + 10;
+}
+
+#ifdef _MSC_VER
+# pragma warning(push)
+# pragma warning(disable: 4127 4146)
+#endif
+// Writes value in base 10 into [first, last), '-' first for negatives; returns one past the last char written, or {last, errc} on failure
+template <typename Integer>
+constexpr to_chars_result to_chars_integer_impl(char* first, char* last, Integer value) noexcept
+{
+    using Unsigned_Integer = typename std::make_unsigned<Integer>::type;
+    Unsigned_Integer unsigned_value {};
+
+    char buffer[10] {}; // scratch area for decompose32, which always emits 10 zero-padded characters
+    int converted_value_digits {};
+    bool is_negative = false;
+    // An inverted range is rejected with invalid_argument before anything is written
+    if (first > last)
+    {
+        return {last, std::errc::invalid_argument};
+    }
+
+    // Strip the sign from the value and apply at the end after parsing if the type is signed
+    BOOST_DECIMAL_IF_CONSTEXPR (std::is_signed<Integer>::value)
+    {
+        if (value < 0)
+        {
+            is_negative = true;
+            unsigned_value = apply_sign(value);
+        }
+        else
+        {
+            unsigned_value = static_cast<Unsigned_Integer>(value);
+        }
+    }
+    else
+    {
+        unsigned_value = static_cast<Unsigned_Integer>(value);
+    }
+    // Room left for digits once the optional '-' has been reserved
+    const std::ptrdiff_t user_buffer_size = last - first - static_cast<std::ptrdiff_t>(is_negative);
+
+    // If the type is less than 32 bits we can use this without change
+    // If the type is greater than 32 bits we use a binary search tree to figure out how many digits
+    // are present and then decompose the value into two (or more) std::uint32_t of known length so that we
+    // don't have the issue of removing leading zeros from the least significant digits
+
+    // Yields: warning C4127: conditional expression is constant because first half of the expression is constant,
+    // but we need to short circuit to avoid UB on the second half
+    if (std::numeric_limits<Integer>::digits <= std::numeric_limits<std::uint32_t>::digits ||
+        unsigned_value <= static_cast<Unsigned_Integer>((std::numeric_limits<std::uint32_t>::max)()))
+    {
+        const auto converted_value = static_cast<std::uint32_t>(unsigned_value);
+        converted_value_digits = num_digits(converted_value);
+
+        if (converted_value_digits > user_buffer_size)
+        {
+            return {last, std::errc::value_too_large};
+        }
+
+        decompose32(converted_value, buffer);
+
+        if (is_negative)
+        {
+            *first++ = '-';
+        }
+        // Copy only the significant tail of the zero-padded scratch buffer
+        boost::decimal::detail::memcpy(first, buffer + (sizeof(buffer) - static_cast<unsigned>(converted_value_digits)),
+                                        static_cast<std::size_t>(converted_value_digits));
+    }
+    else if (std::numeric_limits<Integer>::digits <= std::numeric_limits<std::uint64_t>::digits ||
+             static_cast<std::uint64_t>(unsigned_value) <= (std::numeric_limits<std::uint64_t>::max)()) // NOTE(review): always true after the cast, so a wider value would be truncated here - confirm callers never pass >64-bit types
+    {
+        auto converted_value = static_cast<std::uint64_t>(unsigned_value);
+        converted_value_digits = num_digits(converted_value);
+
+        if (converted_value_digits > user_buffer_size)
+        {
+            return {last, std::errc::value_too_large};
+        }
+
+        if (is_negative)
+        {
+            *first++ = '-';
+        }
+
+        // Only store 9 digits in each to avoid overflow (the digit count computed above is reused, not recomputed)
+        if (converted_value_digits <= 18)
+        {
+            const auto x = static_cast<std::uint32_t>(converted_value / UINT64_C(1000000000));
+            const auto y = static_cast<std::uint32_t>(converted_value % UINT64_C(1000000000));
+            const int first_value_chars = num_digits(x);
+
+            decompose32(x, buffer);
+            boost::decimal::detail::memcpy(first, buffer + (sizeof(buffer) - static_cast<unsigned>(first_value_chars)),
+                                            static_cast<std::size_t>(first_value_chars));
+
+            decompose32(y, buffer);
+            boost::decimal::detail::memcpy(first + first_value_chars, buffer + 1, sizeof(buffer) - 1); // low part is always 9 zero-padded digits
+        }
+        else
+        {
+            const auto x = static_cast<std::uint32_t>(converted_value / UINT64_C(100000000000));
+            converted_value -= x * UINT64_C(100000000000);
+            const auto y = static_cast<std::uint32_t>(converted_value / UINT64_C(100));
+            const auto z = static_cast<std::uint32_t>(converted_value % UINT64_C(100));
+
+            if (converted_value_digits == 19)
+            {
+                decompose32(x, buffer);
+                boost::decimal::detail::memcpy(first, buffer + 2, sizeof(buffer) - 2); // x has 8 digits for a 19-digit value
+
+                decompose32(y, buffer);
+                boost::decimal::detail::memcpy(first + 8, buffer + 1, sizeof(buffer) - 1);
+
+                // Always prints 2 digits last
+                boost::decimal::detail::memcpy(first + 17, radix_table + z * 2, 2);
+            }
+            else // 20
+            {
+                decompose32(x, buffer);
+                boost::decimal::detail::memcpy(first, buffer + 1, sizeof(buffer) - 1); // x has 9 digits for a 20-digit value
+
+                decompose32(y, buffer);
+                boost::decimal::detail::memcpy(first + 9, buffer + 1, sizeof(buffer) - 1);
+
+                // Always prints 2 digits last
+                boost::decimal::detail::memcpy(first + 18, radix_table + z * 2, 2);
+            }
+        }
+    }
+
+    return {first + converted_value_digits, std::errc()};
+}
+// Writes a 128-bit value in base 10 into [first, last): values that fit in 64 bits are delegated, larger ones are emitted as 9-digit chunks
+template <typename Integer, typename Unsigned_Integer = boost::int128::uint128_t>
+constexpr to_chars_result to_chars_128integer_impl(char* first, char* last, Integer value) noexcept
+{
+    Unsigned_Integer unsigned_value {};
+    // Raw room in the output range; the '-' is accounted for in the size check further down
+    const std::ptrdiff_t user_buffer_size = last - first;
+    BOOST_DECIMAL_ATTRIBUTE_UNUSED bool is_negative = false;
+
+    if (first > last)
+    {
+        return {last, std::errc::invalid_argument};
+    }
+    // NOTE(review): the builtin check below names the unsigned 128-bit type although this is the signed path - confirm the signed builtin was intended
+    // Strip the sign from the value and apply at the end after parsing if the type is signed
+    BOOST_DECIMAL_IF_CONSTEXPR (std::numeric_limits<Integer>::is_signed
+                        #ifdef BOOST_DECIMAL_HAS_INT128
+                        || std::is_same<boost::decimal::detail::builtin_uint128_t, Integer>::value
+                        #endif
+                        )
+    {
+        if (value < 0)
+        {
+            is_negative = true;
+            unsigned_value = -(static_cast<Unsigned_Integer>(value));
+        }
+        else
+        {
+            unsigned_value = static_cast<Unsigned_Integer>(value);
+        }
+    }
+    else
+    {
+        unsigned_value = static_cast<Unsigned_Integer>(value);
+    }
+
+    auto converted_value = static_cast<Unsigned_Integer>(unsigned_value);
+
+    const int converted_value_digits = num_digits(converted_value);
+    // Reserve one character for the sign so a negative value can never write past last
+    if (converted_value_digits > user_buffer_size - static_cast<std::ptrdiff_t>(is_negative))
+    {
+        return {last, std::errc::value_too_large};
+    }
+
+    if (is_negative)
+    {
+        *first++ = '-';
+    }
+
+    // If the value fits into 64 bits use the other method of processing (pass the magnitude: the sign is already written)
+    if (converted_value <= (std::numeric_limits<std::uint64_t>::max)())
+    {
+        return to_chars_integer_impl(first, last, static_cast<std::uint64_t>(converted_value));
+    }
+
+    constexpr std::uint32_t ten_9 = UINT32_C(1000000000);
+    char buffer[5][10] {}; // five 9-digit chunks are enough for the 39 digits of a 128-bit value
+    int num_chars[5] {};
+    int i = 0;
+    // Peel off 9 decimal digits at a time; chunks are stored least significant first
+    while (converted_value != 0)
+    {
+        auto digits = static_cast<std::uint32_t>(converted_value % ten_9);
+        num_chars[i] = num_digits(digits);
+        decompose32(digits, buffer[i]); // Always returns 10 digits (to include leading 0s) which we want
+        converted_value = (converted_value - digits) / ten_9;
+        ++i;
+    }
+    // i - 1 is the most significant chunk: it is printed without its leading zeros
+    --i;
+    auto offset = static_cast<std::size_t>(num_chars[i]);
+    boost::decimal::detail::memcpy(first, buffer[i] + 10 - offset, offset);
+    // Every remaining chunk contributes exactly 9 zero-padded digits
+    while (i > 0)
+    {
+        --i;
+        boost::decimal::detail::memcpy(first + offset, buffer[i] + 1, 9);
+        offset += 9;
+    }
+
+    return {first + converted_value_digits, std::errc()};
+}
+
+#ifdef _MSC_VER
+# pragma warning(pop)
+#endif
+
 #if defined(__GNUC__) && __GNUC__ == 7
 #pragma GCC diagnostic pop
 #endif

Original file line number	Diff line number	Diff line change
`@@ -324,7 +324,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_scientific_impl(char* first, char* last, c`
`324`	`324`	`}`
`325`	`325`
`326`	`326`	`// Offset the value of first by 1 so that we can copy the leading digit and insert a decimal point`
`327`		`- auto r = to_chars_integer_impl<uint_type, uint_type>(first + 1, last, significand, 10);`
	`327`	`+ auto r = to_chars_integer_impl<uint_type>(first + 1, last, significand);`
`328`	`328`
`329`	`329`	`// Only real reason we will hit this is a buffer overflow`
`330`	`330`	`if (BOOST_DECIMAL_UNLIKELY(!r))`
`@@ -398,7 +398,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_scientific_impl(char* first, char* last, c`
`398`	`398`	`*first++ = '0';`
`399`	`399`	`}`
`400`	`400`
`401`		`- r = to_chars_integer_impl<int, unsigned>(first, last, abs_exp, 10);`
	`401`	`+ r = to_chars_integer_impl<int>(first, last, abs_exp);`
`402`	`402`	`if (BOOST_DECIMAL_UNLIKELY(!r))`
`403`	`403`	`{`
`404`	`404`	`return r; // LCOV_EXCL_LINE`
`@@ -544,7 +544,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_fixed_impl(char* first, char* last, const`
`544`	`544`	`std::numeric_limits<std::uint64_t>::digits),`
`545`	`545`	`int128::uint128_t, std::uint64_t>;`
`546`	`546`
`547`		`- auto r = to_chars_integer_impl<uint_type, uint_type>(first, last, significand, 10);`
	`547`	`+ auto r = to_chars_integer_impl<uint_type>(first, last, significand);`
`548`	`548`
`549`	`549`	`if (BOOST_DECIMAL_UNLIKELY(!r))`
`550`	`550`	`{`
`@@ -775,7 +775,7 @@ BOOST_DECIMAL_CONSTEXPR auto to_chars_hex_impl(char* first, char* last, const Ta`
`775`	`775`	`*first++ = '0';`
`776`	`776`	`}`
`777`	`777`
`778`		`- return to_chars_integer_impl<std::uint32_t, std::uint32_t>(first, last, static_cast<std::uint32_t>(abs_exp), 10);`
	`778`	`+ return to_chars_integer_impl<std::uint32_t>(first, last, static_cast<std::uint32_t>(abs_exp));`
`779`	`779`	`}`
`780`	`780`
`781`	`781`	`#ifdef _MSC_VER`