Implement expm1 for decimal64/decimal128 and other small repairs

ckormanyos · ckormanyos · commit a145fdcf293e · 2024-05-11T09:36:34.000+02:00
diff --git a/include/boost/decimal/detail/cmath/expm1.hpp b/include/boost/decimal/detail/cmath/expm1.hpp
@@ -7,13 +7,14 @@
 #define BOOST_DECIMAL_DETAIL_CMATH_EXPM1_HPP
 
 #include <boost/decimal/fwd.hpp> // NOLINT(llvm-include-order)
-#include <boost/decimal/detail/type_traits.hpp>
+#include <boost/decimal/detail/cmath/impl/expm1_impl.hpp>
 #include <boost/decimal/detail/concepts.hpp>
 #include <boost/decimal/detail/config.hpp>
+#include <boost/decimal/detail/type_traits.hpp>
 #include <boost/decimal/numbers.hpp>
 
 #ifndef BOOST_DECIMAL_BUILD_MODULE
-#include <array>
+#include <cmath>
 #include <type_traits>
 #endif
 
@@ -70,66 +71,7 @@ constexpr auto expm1_impl(T x) noexcept
         }
         else
         {
-            // Specifically derive a polynomial expansion for Exp[x] - 1 for this work.
-            //   Table[{x, Exp[x] - 1}, {x, -Log[2], Log[2], 1/60}]
-            //   N[%, 48]
-            //   Fit[%, {x, x^2, x^3, x^4, x^5, x^6, x^7, x^8, x^9, x^10, x^11, x^12, x^13, x^14}, x]
-
-            //   0.1000000000000000003213692169066381945529176657E+01 x
-            // + 0.4999999999999999998389405741198241227273662223E+00 x^2
-            // + 0.1666666666666664035765593562709186076539985328E+00 x^3
-            // + 0.4166666666666666934614928838666442575683452206E-01 x^4
-            // + 0.8333333333339521841328202617206868796855583809E-02 x^5
-            // + 0.1388888888888953513176946682731620625302469979E-02 x^6
-            // + 0.1984126983488689186859793276462049624439889135E-03 x^7
-            // + 0.2480158730001499149369647648735612017495156006E-04 x^8
-            // + 0.2755732258782898252481007286813761544775538366E-05 x^9
-            // + 0.2755732043147979013276287368071846972098889744E-06 x^10
-            // + 0.2505116286861719378770371641094067075234027345E-07 x^11
-            // + 0.2087632598463662328337672597832718168295672334E-08 x^12
-            // + 0.1619385892296180390338553597911165126625722485E-09 x^13
-            // + 0.1154399218598221557485183048765404442959841646E-10 x^14
-
-            using coefficient_array_type = std::array<T, static_cast<std::size_t>(UINT8_C(14))>;
-
-            #if (defined(__clang__) && (__clang__ < 6))
-            #  pragma clang diagnostic push
-            #  pragma clang diagnostic ignored "-Wmissing-braces"
-            #endif
-
-            constexpr auto coefficient_table =
-                coefficient_array_type
-                {
-                    T { UINT64_C(100000000000000000), -17 -  0 }, // * x
-                    T { UINT64_C(500000000000000000), -18 -  0 }, // * x^2
-                    T { UINT64_C(166666666666666404), -18 -  0 }, // * x^3
-                    T { UINT64_C(416666666666666693), -18 -  1 }, // * x^4
-                    T { UINT64_C(833333333333952184), -18 -  2 }, // * x^5
-                    T { UINT64_C(138888888888895351), -18 -  2 }, // * x^6
-                    T { UINT64_C(198412698348868919), -18 -  3 }, // * x^7
-                    T { UINT64_C(248015873000149915), -18 -  4 }, // * x^8
-                    T { UINT64_C(275573225878289825), -18 -  5 }, // * x^9
-                    T { UINT64_C(275573204314797901), -18 -  6 }, // * x^10
-                    T { UINT64_C(250511628686171938), -18 -  7 }, // * x^11
-                    T { UINT64_C(208763259846366233), -18 -  8 }, // * x^12
-                    T { UINT64_C(161938589229618039), -18 -  9 }, // * x^13
-                    T { UINT64_C(115439921859822156), -18 - 10 }  // * x^14
-                };
-
-            #if (defined(__clang__) && (__clang__ < 6))
-            #  pragma clang diagnostic pop
-            #endif
-
-            auto rit = coefficient_table.crbegin() + static_cast<std::size_t>((sizeof(T) == 4U) ? 5U : 0U);
-
-            result = *rit;
-
-            while(rit != coefficient_table.crend())
-            {
-                result = fma(result, x, *rit++);
-            }
-
-            result *= x;
+            result = x * detail::expm1_series_expansion(x);
         }
     }
 
diff --git a/include/boost/decimal/detail/cmath/ilogb.hpp b/include/boost/decimal/detail/cmath/ilogb.hpp
@@ -22,26 +22,30 @@ BOOST_DECIMAL_EXPORT template <typename T>
 constexpr auto ilogb(T d) noexcept
     BOOST_DECIMAL_REQUIRES_RETURN(detail::is_decimal_floating_point_v, T, int)
 {
-    const auto fpc_d = fpclassify(d);
+    const auto fpc = fpclassify(d);
 
-    if (fpc_d == FP_ZERO)
+    int result { };
+
+    if (fpc == FP_ZERO)
     {
-        return FP_ILOGB0;
+        result = static_cast<int>(FP_ILOGB0);
     }
-    else if (fpc_d == FP_INFINITE)
+    else if (fpc == FP_INFINITE)
     {
-        return INT_MAX;
+        result = static_cast<int>(INT_MAX);
     }
-    else if (fpc_d == FP_NAN)
+    else if (fpc == FP_NAN)
     {
-        return FP_ILOGBNAN;
+        result = static_cast<int>(FP_ILOGBNAN);
     }
+    else
+    {
+        const auto offset = detail::num_digits(d.full_significand()) - 1;
 
-    const auto offset = detail::num_digits(d.full_significand()) - 1;
-
-    const auto expval = static_cast<int>(static_cast<int>(d.unbiased_exponent()) + offset);
+        result = static_cast<int>(static_cast<int>(d.unbiased_exponent()) + offset);
+    }
 
-    return expval;
+    return result;
 }
 
 } // namespace decimal
diff --git a/include/boost/decimal/detail/cmath/impl/expm1_impl.hpp b/include/boost/decimal/detail/cmath/impl/expm1_impl.hpp
@@ -0,0 +1,158 @@
+// Copyright 2023 - 2024 Matt Borland
+// Copyright 2023 - 2024 Christopher Kormanyos
+// Distributed under the Boost Software License, Version 1.0.
+// https://www.boost.org/LICENSE_1_0.txt
+
+#ifndef BOOST_DECIMAL_DETAIL_CMATH_IMPL_EXPM1_IMPL_HPP
+#define BOOST_DECIMAL_DETAIL_CMATH_IMPL_EXPM1_IMPL_HPP
+
+#include <boost/decimal/detail/concepts.hpp>
+#include <boost/decimal/detail/cmath/impl/taylor_series_result.hpp>
+
+#ifndef BOOST_DECIMAL_BUILD_MODULE
+#include <array>
+#include <cstddef>
+#include <cstdint>
+#endif
+
+namespace boost {
+namespace decimal {
+namespace detail {
+
+namespace expm1_detail {
+
+template <bool b>
+struct expm1_table_imp
+{
+private:
+    using d32_coeffs_t  = std::array<decimal32,  10>;
+    using d64_coeffs_t  = std::array<decimal64,  14>;
+    using d128_coeffs_t = std::array<decimal128, 32>;
+
+public:
+    static constexpr d32_coeffs_t d32_coeffs =
+    {{
+        // Specifically derive a polynomial expansion for Exp[x] - 1 for this work.
+        //   Table[{x, Exp[x] - 1}, {x, -Log[2], Log[2], 1/60}]
+        //   N[%, 48]
+        //   Fit[%, {x, x^2, x^3, x^4, x^5, x^6, x^7, x^8, x^9, x^10}, x]
+
+        ::boost::decimal::decimal32 { UINT64_C(1000000000005449334), - 19 + 1 }, // * x
+        ::boost::decimal::decimal32 { UINT64_C(5000000000003881336), - 19 - 0 }, // * x^2
+        ::boost::decimal::decimal32 { UINT64_C(1666666664242981149), - 19 - 0 }, // * x^3
+        ::boost::decimal::decimal32 { UINT64_C(4166666665026072773), - 19 - 1 }, // * x^4
+        ::boost::decimal::decimal32 { UINT64_C(8333336317448167991), - 19 - 2 }, // * x^5
+        ::boost::decimal::decimal32 { UINT64_C(1388889096793935619), - 19 - 2 }, // * x^6
+        ::boost::decimal::decimal32 { UINT64_C(1983978347911205530), - 19 - 3 }, // * x^7
+        ::boost::decimal::decimal32 { UINT64_C(2480049494648544583), - 19 - 4 }, // * x^8
+        ::boost::decimal::decimal32 { UINT64_C(2787876201220259352), - 19 - 5 }, // * x^9
+        ::boost::decimal::decimal32 { UINT64_C(2780855729673643225), - 19 - 6 }, // * x^10
+    }};
+
+    static constexpr d64_coeffs_t d64_coeffs =
+    {{
+        // Specifically derive a polynomial expansion for Exp[x] - 1 for this work.
+        //   Table[{x, Exp[x] - 1}, {x, -Log[2], Log[2], 1/60}]
+        //   N[%, 48]
+        //   Fit[%, {x, x^2, x^3, x^4, x^5, x^6, x^7, x^8, x^9, x^10, x^11, x^12, x^13, x^14}, x]
+
+        ::boost::decimal::decimal64 { UINT64_C(1000000000000000003), - 19 +  1 }, // * x
+        ::boost::decimal::decimal64 { UINT64_C(4999999999999999998), - 19 -  0 }, // * x^2
+        ::boost::decimal::decimal64 { UINT64_C(1666666666666664035), - 19 -  0 }, // * x^3
+        ::boost::decimal::decimal64 { UINT64_C(4166666666666666934), - 19 -  1 }, // * x^4
+        ::boost::decimal::decimal64 { UINT64_C(8333333333339521841), - 19 -  2 }, // * x^5
+        ::boost::decimal::decimal64 { UINT64_C(1388888888888953513), - 19 -  2 }, // * x^6
+        ::boost::decimal::decimal64 { UINT64_C(1984126983488689186), - 19 -  3 }, // * x^7
+        ::boost::decimal::decimal64 { UINT64_C(2480158730001499149), - 19 -  4 }, // * x^8
+        ::boost::decimal::decimal64 { UINT64_C(2755732258782898252), - 19 -  5 }, // * x^9
+        ::boost::decimal::decimal64 { UINT64_C(2755732043147979013), - 19 -  6 }, // * x^10
+        ::boost::decimal::decimal64 { UINT64_C(2505116286861719378), - 19 -  7 }, // * x^11
+        ::boost::decimal::decimal64 { UINT64_C(2087632598463662328), - 19 -  8 }, // * x^12
+        ::boost::decimal::decimal64 { UINT64_C(1619385892296180390), - 19 -  9 }, // * x^13
+        ::boost::decimal::decimal64 { UINT64_C(1154399218598221557), - 19 - 10 }  // * x^14
+     }};
+
+    static constexpr d128_coeffs_t d128_coeffs =
+    {{
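+        // Polynomial expansion for Exp[x] - 1. NOTE(review): the Fit recipe below mirrors the decimal64 table, but the x^9 and x^10 entries here share one significand (as 1/9! and 1/10! do), so these look like plain 1/n! Taylor terms - confirm.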
+        //   Table[{x, Exp[x] - 1}, {x, -Log[2], Log[2], 1/60}]
+        //   N[%, 48]
+        //   Fit[%, {x, x^2, x^3, x^4, x^5, x^6, x^7, x^8, x^9, x^10, x^11, x^12, x^13, x^14, x^15, x^16, x^17, x^18, x^19, x^20, x^21, x^22, x^23, x^24, x^25, x^26, x^27, x^28, x^29, x^30, x^31, x^32 }, x]
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(54210108624275),  UINT64_C(4089650035136921600)  }, -33 }, // * x
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(271050543121376), UINT64_C(2001506101975056384)  }, -34 }, // * x^2
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(90350181040458),  UINT64_C(12964998083131386532) }, -34 }, // * x^3
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(225875452601146), UINT64_C(13965751134118914724) }, -35 }, // * x^4
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(451750905202293), UINT64_C(9484758194528277842)  }, -36 }, // * x^5
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(75291817533715),  UINT64_C(10804165069276155440) }, -36 }, // * x^6
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(107559739333879), UINT64_C(7528774067376128516)  }, -37 }, // * x^7
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(134449674167349), UINT64_C(4799281565792772746)  }, -38 }, // * x^8
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(149388526852610), UINT64_C(5332535073103080820)  }, -39 }, // * x^9
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(149388526852610), UINT64_C(5332535073103080820)  }, -40 }, // * x^10
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(135807751684191), UINT64_C(3170782423392841514)  }, -41 }, // * x^11
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(113173126403492), UINT64_C(11865690723015477068) }, -42 }, // * x^12
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(87056251079609),  UINT64_C(13384395342406416636) }, -43 }, // * x^13
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(62183036485435),  UINT64_C(9560282387433156335)  }, -44 }, // * x^14
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(414553576569570), UINT64_C(2246069003862680020)  }, -46 }, // * x^15
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(259095985355981), UINT64_C(6015479145828949264)  }, -47 }, // * x^16
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(152409403150577), UINT64_C(4623619732418095578)  }, -48 }, // * x^17
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(84671890639209),  UINT64_C(10767230558026320466) }, -49 }, // * x^18
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(445641529680050), UINT64_C(8125595620937745600)  }, -51 }, // * x^19
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(222820764840025), UINT64_C(4062767274683195140)  }, -52 }, // * x^20
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(106105126114297), UINT64_C(13344759429965740488) }, -53 }, // * x^21
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(482296027792262), UINT64_C(7088674266265745598)  }, -55 }, // * x^22
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(209693925127072), UINT64_C(336105452763225878)   }, -56 }, // * x^23
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(87372468802945),  UINT64_C(10013088901203012320) }, -57 }, // * x^24
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(349489875208886), UINT64_C(9445768661182748344)  }, -59 }, // * x^25
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(134419182774415), UINT64_C(9680981560342232810)  }, -60 }, // * x^26
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(497848829278818), UINT64_C(16288994997110182382) }, -62 }, // * x^27
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(177803151475355), UINT64_C(16680206430774781810) }, -63 }, // * x^28
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(61311025561137),  UINT64_C(7837795588749518446)  }, -64 }, // * x^29
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(204371229207757), UINT64_C(18366861741830034248) }, -66 }, // * x^30
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(66162682638108),  UINT64_C(6755035083974089930)  }, -67 }, // * x^31
+        ::boost::decimal::decimal128 { boost::decimal::detail::uint128 { UINT64_C(206436477688751), UINT64_C(15666750779045089894) }, -69 }, // * x^32
+    }};
+};
+
+#if !(defined(__cpp_inline_variables) && __cpp_inline_variables >= 201606L) && (!defined(_MSC_VER) || _MSC_VER != 1900)
+
+template <bool b>
+constexpr typename expm1_table_imp<b>::d32_coeffs_t expm1_table_imp<b>::d32_coeffs;
+
+template <bool b>
+constexpr typename expm1_table_imp<b>::d64_coeffs_t expm1_table_imp<b>::d64_coeffs;
+
+template <bool b>
+constexpr typename expm1_table_imp<b>::d128_coeffs_t expm1_table_imp<b>::d128_coeffs;
+
+#endif
+
+} //namespace expm1_detail
+
+using expm1_table = expm1_detail::expm1_table_imp<true>;
+
+template <BOOST_DECIMAL_DECIMAL_FLOATING_TYPE T>
+constexpr auto expm1_series_expansion(T x) noexcept;
+
+template <>
+constexpr auto expm1_series_expansion<decimal32>(decimal32 x) noexcept
+{
+    return taylor_series_result(x, expm1_table::d32_coeffs);
+}
+
+template <>
+constexpr auto expm1_series_expansion<decimal64>(decimal64 x) noexcept
+{
+    return taylor_series_result(x, expm1_table::d64_coeffs);
+}
+
+template <>
+constexpr auto expm1_series_expansion<decimal128>(decimal128 x) noexcept
+{
+    return taylor_series_result(x, expm1_table::d128_coeffs);
+}
+
+} //namespace detail
+} //namespace decimal
+} //namespace boost
+
+#endif //BOOST_DECIMAL_DETAIL_CMATH_IMPL_EXPM1_IMPL_HPP
diff --git a/include/boost/decimal/detail/cmath/log.hpp b/include/boost/decimal/detail/cmath/log.hpp
@@ -52,6 +52,11 @@ constexpr auto log_impl(T x) noexcept
     }
     else if(x > one)
     {
+        // Use the implementation of log10 in order to compute the natural
+        // logarithm. The base of the boost::decimal library is, in fact,
+        // base-10. And so, somewhat uncommonly, the fastest and most accurate
+        // logarithm in this system is log10 in base-10.
+
         result = log10(x) * numbers::ln10_v<T>;
     }
     else
diff --git a/test/test_expm1.cpp b/test/test_expm1.cpp
diff --git a/test/test_pow.cpp b/test/test_pow.cpp

Original file line number	Diff line number	Diff line change
`@@ -22,26 +22,30 @@ BOOST_DECIMAL_EXPORT template <typename T>`
`22`	`22`	`constexpr auto ilogb(T d) noexcept`
`23`	`23`	`BOOST_DECIMAL_REQUIRES_RETURN(detail::is_decimal_floating_point_v, T, int)`
`24`	`24`	`{`
`25`		`- const auto fpc_d = fpclassify(d);`
	`25`	`+ const auto fpc = fpclassify(d);`
`26`	`26`
`27`		`- if (fpc_d == FP_ZERO)`
	`27`	`+ int result { };`
	`28`	`+`
	`29`	`+ if (fpc == FP_ZERO)`
`28`	`30`	`{`
`29`		`- return FP_ILOGB0;`
	`31`	`+ result = static_cast<int>(FP_ILOGB0);`
`30`	`32`	`}`
`31`		`- else if (fpc_d == FP_INFINITE)`
	`33`	`+ else if (fpc == FP_INFINITE)`
`32`	`34`	`{`
`33`		`- return INT_MAX;`
	`35`	`+ result = static_cast<int>(INT_MAX);`
`34`	`36`	`}`
`35`		`- else if (fpc_d == FP_NAN)`
	`37`	`+ else if (fpc == FP_NAN)`
`36`	`38`	`{`
`37`		`- return FP_ILOGBNAN;`
	`39`	`+ result = static_cast<int>(FP_ILOGBNAN);`
`38`	`40`	`}`
	`41`	`+ else`
	`42`	`+ {`
	`43`	`+ const auto offset = detail::num_digits(d.full_significand()) - 1;`
`39`	`44`
`40`		`- const auto offset = detail::num_digits(d.full_significand()) - 1;`
`41`		`-`
`42`		`- const auto expval = static_cast<int>(static_cast<int>(d.unbiased_exponent()) + offset);`
	`45`	`+ result = static_cast<int>(static_cast<int>(d.unbiased_exponent()) + offset);`
	`46`	`+ }`
`43`	`47`
`44`		`- return expval;`
	`48`	`+ return result;`
`45`	`49`	`}`
`46`	`50`
`47`	`51`	`} // namespace decimal`
Original file line number	Diff line number	Diff line change
`@@ -52,6 +52,11 @@ constexpr auto log_impl(T x) noexcept`
`52`	`52`	`}`
`53`	`53`	`else if(x > one)`
`54`	`54`	`{`
	`55`	`+ // Use the implementation of log10 in order to compute the natural`
	`56`	`+ // logarithm. The base of the boost::decimal library is, in fact,`
	`57`	`+ // base-10. And so, somewhat uncommonly, the fastest and most accurate`
	`58`	`+ // logarithm in this system is log10 in base-10.`
	`59`	`+`
`55`	`60`	`result = log10(x) * numbers::ln10_v<T>;`
`56`	`61`	`}`
`57`	`62`	`else`