Merge pull request #952 from cppalliance/951

mborland · web-flow · commit 40762516e956 · 2025-07-31T14:42:04.000-04:00
Bugfixes for Intel Benchmarks and update docs with complete results
diff --git a/doc/modules/ROOT/pages/benchmarks.adoc b/doc/modules/ROOT/pages/benchmarks.adoc
@@ -24,6 +24,13 @@ To run the benchmarks yourself, navigate to the test folder and define `BOOST_DE
 An example on Linux with b2: `../../../b2 cxxstd=20 toolset=gcc-13 define=BOOST_DECIMAL_RUN_BENCHMARKS benchmarks -a release`, or
 `../../../b2 cxxstd=20 toolset=gcc-13 define=BOOST_DECIMAL_RUN_BENCHMARKS=1,BOOST_DECIMAL_BENCHMARK_CHARCONV=1 benchmarks -a release` to also run the `<charconv>` benchmarks
 
+To run the GCC benchmarks you can use the following command: `gcc benchmark_libdfp.c -O3 -std=c17` followed by: `./a.out`
+
+To run the Intel benchmarks you will need both the https://www.intel.com/content/www/us/en/developer/tools/oneapi/overview.html[Intel Compiler] and the https://www.intel.com/content/www/us/en/developer/articles/tool/intel-decimal-floating-point-math-library.html[Intel Decimal Floating-Point Math Library].
+You can then use the following command: `icx benchmark_libbid.c -O3 $PATH_TO_LIBBID/libbid.a -std=c17` followed by: `./a.out`
+
+NOTE: The Intel benchmarks can only be run on one of their supported architectures: IA-32, IA-64, and Intel x64
+
 == Methodology
 
 === Comparisons
@@ -85,14 +92,14 @@ Intel Compiler:
 | 698,945
 | 4.856
 | Intel `Decimal32`
-| 2,023,493
-| 14.059
+| 2,411,294
+| 16.754
 | Intel `Decimal64`
-| 2,386,409
-| 16.581
+| 3,158,422
+| 21.945
 | Intel `Decimal128`
-| 3,203,050
-| 22.255
+| 3,389,883
+| 23.553
 |===
 
 GCC:
@@ -165,14 +172,14 @@ Intel Compiler:
 | 1,367,004
 | 15.092
 | Intel `Decimal32`
-| 1,159,069
-| 12.796
+| 1,242,797
+| 13.721
 | Intel `Decimal64`
-| 1,248,111
-| 13.779
+| 1,689,585
+| 18.653
 | Intel `Decimal128`
-| 2,099,084
-| 23.174
+| 1,958,345
+| 21.620
 |===
 
 GCC:
@@ -245,14 +252,14 @@ Intel Compiler:
 | 1,212,405
 | 16.564
 | Intel `Decimal32`
-| 1,275,562
-| 17.427
+| 1,922,108
+| 26.261
 | Intel `Decimal64`
-| 1,019,947
-| 13.935
+| 1,793,879
+| 24.509
 | Intel `Decimal128`
-| 2,162,490
-| 29.545
+| 2,397,372
+| 32.754
 |===
 
 GCC:
@@ -325,15 +332,14 @@ Intel Compiler:
 | 5,959,977
 | 81.870
 | Intel `Decimal32`
-| 931,655
-| 12.798
+| 1,375,434
+| 18.894
 | Intel `Decimal64`
-| 963,464
-| 13.235
-// For unknown reasons this function segfaults
-//| Intel `Decimal128`
-//| 2,162,490
-//| 29.545
+| 2,052,278
+| 28.191
+| Intel `Decimal128`
+| 5,964,489
+| 81.932
 |===
 
 GCC:
@@ -405,16 +411,15 @@ Intel Compiler:
 | `decimal_fast128_t`
 | 8,277,721
 | 79.750
-// For unknown reasons this function segfaults
-//| Intel `Decimal32`
-//| 931,655
-//| 12.798
-//| Intel `Decimal64`
-//| 963,464
-//| 13.235
-//| Intel `Decimal128`
-//| 2,162,490
-//| 29.545
+| Intel `Decimal32`
+| 1,561,213
+| 15.041
+| Intel `Decimal64`
+| 3,115,862
+| 30.019
+| Intel `Decimal128`
+| 7,474,712
+| 72.013
 |===
 
 GCC:
diff --git a/test/benchmark_libbid.c b/test/benchmark_libbid.c
@@ -3,8 +3,6 @@
 // https://www.boost.org/LICENSE_1_0.txt
 
 #define _POSIX_C_SOURCE 199309L
-#define DECIMAL_GLOBAL_ROUNDING 1
-#define DECIMAL_GLOBAL_EXCEPTION_FLAGS 1
 
 #include <stdio.h>
 #include <stdlib.h>
@@ -23,6 +21,8 @@ typedef BID_UINT128 Decimal128;
 #define K 20000000
 #define N 5
 
+uint32_t flag = 0;
+
 uint32_t random_uint32(void) 
 {
     uint32_t r = 0;
@@ -36,20 +36,20 @@ uint32_t random_uint32(void)
 
 uint64_t random_uint64(void) 
 {
-    uint32_t r = 0;
+    uint64_t r = 0;
     for (int i = 0; i < 4; i++) 
     {
         r = (r << 16) | (rand() & 0xFFFF);
     }
-    
+
     return r;
 }
 
 __attribute__ ((noinline)) void generate_vector_32(Decimal32* buffer, size_t buffer_len)
 {
     for (size_t i = 0; i < buffer_len; ++i)
     {
-        buffer[i] = bid32_from_uint32(random_uint32() % 100);
+        buffer[i] = bid32_from_uint32(random_uint32(), BID_ROUNDING_DOWN, &flag);
     }
 }
 
@@ -67,12 +67,12 @@ __attribute__ ((noinline)) void test_comparisons_32(Decimal32* data, const char*
             Decimal32 val1 = data[k];
             Decimal32 val2 = data[k + 1];
 
-            s += (size_t)bid32_quiet_less(val1, val2);
-            s += (size_t)bid32_quiet_less_equal(val1, val2);
-            s += (size_t)bid32_quiet_greater(val1, val2);
-            s += (size_t)bid32_quiet_greater_equal(val1, val2);
-            s += (size_t)bid32_quiet_equal(val1, val2);
-            s += (size_t)bid32_quiet_not_equal(val1, val2);
+            s += (size_t)bid32_quiet_less(val1, val2, &flag);
+            s += (size_t)bid32_quiet_less_equal(val1, val2, &flag);
+            s += (size_t)bid32_quiet_greater(val1, val2, &flag);
+            s += (size_t)bid32_quiet_greater_equal(val1, val2, &flag);
+            s += (size_t)bid32_quiet_equal(val1, val2, &flag);
+            s += (size_t)bid32_quiet_not_equal(val1, val2, &flag);
         }
     }
 
@@ -86,7 +86,7 @@ __attribute__ ((noinline)) void generate_vector_64(Decimal64* buffer, size_t buf
 {
     for (size_t i = 0; i < buffer_len; ++i)
     {
-        buffer[i] = bid64_from_uint64(random_uint64() % 10000);
+        buffer[i] = bid64_from_uint64(random_uint64(), BID_ROUNDING_DOWN, &flag);
     }
 }
 
@@ -104,12 +104,12 @@ __attribute__ ((noinline)) void test_comparisons_64(Decimal64* data, const char*
             Decimal64 val1 = data[k];
             Decimal64 val2 = data[k + 1];
 
-            s += (size_t)bid64_quiet_less(val1, val2);
-            s += (size_t)bid64_quiet_less_equal(val1, val2);
-            s += (size_t)bid64_quiet_greater(val1, val2);
-            s += (size_t)bid64_quiet_greater_equal(val1, val2);
-            s += (size_t)bid64_quiet_equal(val1, val2);
-            s += (size_t)bid64_quiet_not_equal(val1, val2);
+            s += (size_t)bid64_quiet_less(val1, val2, &flag);
+            s += (size_t)bid64_quiet_less_equal(val1, val2, &flag);
+            s += (size_t)bid64_quiet_greater(val1, val2, &flag);
+            s += (size_t)bid64_quiet_greater_equal(val1, val2, &flag);
+            s += (size_t)bid64_quiet_equal(val1, val2, &flag);
+            s += (size_t)bid64_quiet_not_equal(val1, val2, &flag);
         }
     }
 
@@ -125,7 +125,7 @@ __attribute__ ((__noinline__)) void generate_vector_128(Decimal128* buffer, size
     size_t i = 0;
     while (i < buffer_len)
     {
-        buffer[i] = bid128_from_uint64(random_uint64() % 100);
+        buffer[i] = bid128_from_uint64(random_uint64());
         ++i;
     }
 }
@@ -144,12 +144,12 @@ __attribute__ ((__noinline__)) void test_comparisons_128(Decimal128* data, const
             Decimal128 val1 = data[k];
             Decimal128 val2 = data[k + 1];
 
-            s += (size_t)bid128_quiet_less(val1, val2);
-            s += (size_t)bid128_quiet_less_equal(val1, val2);
-            s += (size_t)bid128_quiet_greater(val1, val2);
-            s += (size_t)bid128_quiet_greater_equal(val1, val2);
-            s += (size_t)bid128_quiet_equal(val1, val2);
-            s += (size_t)bid128_quiet_not_equal(val1, val2);
+            s += (size_t)bid128_quiet_less(val1, val2, &flag);
+            s += (size_t)bid128_quiet_less_equal(val1, val2, &flag);
+            s += (size_t)bid128_quiet_greater(val1, val2, &flag);
+            s += (size_t)bid128_quiet_greater_equal(val1, val2, &flag);
+            s += (size_t)bid128_quiet_equal(val1, val2, &flag);
+            s += (size_t)bid128_quiet_not_equal(val1, val2, &flag);
         }
     }
 
@@ -164,21 +164,21 @@ typedef Decimal32 (*operation_32)(Decimal32, Decimal32);
 
 __attribute__ ((noinline)) Decimal32 add_32(Decimal32 a, Decimal32 b)
 {
-    return bid32_add(a, b);
+    return bid32_add(a, b, BID_ROUNDING_DOWN, &flag);
 }
 __attribute__ ((noinline)) Decimal32 sub_32(Decimal32 a, Decimal32 b)
 {
-    return bid32_sub(a, b);
+    return bid32_sub(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((noinline)) Decimal32 mul_32(Decimal32 a, Decimal32 b)
 {
-    return bid32_mul(a, b);
+    return bid32_mul(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((noinline)) Decimal32 div_32(Decimal32 a, Decimal32 b)
 {
-    return bid32_div(a, b);
+    return bid32_div(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((noinline)) void test_two_element_operation_32(Decimal32* data, operation_32 op, const char* label, const char* op_label)
@@ -195,7 +195,7 @@ __attribute__ ((noinline)) void test_two_element_operation_32(Decimal32* data, o
             Decimal32 val1 = data[k];
             Decimal32 val2 = data[k + 1];
 
-            s += (size_t)bid32_to_int32_int(op(val1, val2));
+            s += (size_t)bid32_to_int32_int(op(val1, val2), &flag);
         }
     }
 
@@ -209,22 +209,22 @@ typedef Decimal64 (*operation_64)(Decimal64, Decimal64);
 
 __attribute__ ((noinline)) Decimal64 add_64(Decimal64 a, Decimal64 b)
 {
-    return bid64_add(a, b);
+    return bid64_add(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((noinline)) Decimal64 sub_64(Decimal64 a, Decimal64 b)
 {
-    return bid64_sub(a, b);
+    return bid64_sub(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((noinline)) Decimal64 mul_64(Decimal64 a, Decimal64 b)
 {
-    return bid64_mul(a, b);
+    return bid64_mul(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((noinline)) Decimal64 div_64(Decimal64 a, Decimal64 b)
 {
-    return bid64_div(a, b);
+    return bid64_div(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((noinline)) void test_two_element_operation_64(Decimal64* data, operation_64 op, const char* label, const char* op_label)
@@ -241,7 +241,7 @@ __attribute__ ((noinline)) void test_two_element_operation_64(Decimal64* data, o
             Decimal64 val1 = data[k];
             Decimal64 val2 = data[k + 1];
 
-            s += (size_t)bid64_to_int64_int(op(val1, val2));
+            s += (size_t)bid64_to_int64_int(op(val1, val2), &flag);
         }
     }
 
@@ -256,22 +256,22 @@ typedef Decimal128 (*operation_128)(Decimal128, Decimal128);
 
 __attribute__ ((__noinline__)) Decimal128 add_128(Decimal128 a, Decimal128 b)
 {
-    return bid128_add(a, b);
+    return bid128_add(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((__noinline__)) Decimal128 sub_128(Decimal128 a, Decimal128 b)
 {
-    return bid128_sub(a, b);
+    return bid128_sub(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((__noinline__)) Decimal128 mul_128(Decimal128 a, Decimal128 b)
 {
-    return bid128_mul(a, b);
+    return bid128_mul(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((__noinline__)) Decimal128 div_128(Decimal128 a, Decimal128 b)
 {
-    return bid128_div(a, b);
+    return bid128_div(a, b, BID_ROUNDING_DOWN, &flag);
 }
 
 __attribute__ ((__noinline__)) void test_two_element_operation_128(Decimal128* data, operation_128 op, const char* label, const char* op_label)
@@ -288,7 +288,7 @@ __attribute__ ((__noinline__)) void test_two_element_operation_128(Decimal128* d
             Decimal128 val1 = data[k];
             Decimal128 val2 = data[k + 1];
 
-            s += (size_t)bid128_to_int64_int(op(val1, val2));
+            s += (size_t)bid128_to_int64_int(op(val1, val2), &flag);
         }
     }
 

Original file line number	Diff line number	Diff line change
`@@ -3,8 +3,6 @@`
`3`	`3`	`// https://www.boost.org/LICENSE_1_0.txt`
`4`	`4`
`5`	`5`	`#define _POSIX_C_SOURCE 199309L`
`6`		`-#define DECIMAL_GLOBAL_ROUNDING 1`
`7`		`-#define DECIMAL_GLOBAL_EXCEPTION_FLAGS 1`
`8`	`6`
`9`	`7`	`#include <stdio.h>`
`10`	`8`	`#include <stdlib.h>`
`@@ -23,6 +21,8 @@ typedef BID_UINT128 Decimal128;`
`23`	`21`	`#define K 20000000`
`24`	`22`	`#define N 5`
`25`	`23`
	`24`	`+uint32_t flag = 0;`
	`25`	`+`
`26`	`26`	`uint32_t random_uint32(void)`
`27`	`27`	`{`
`28`	`28`	`uint32_t r = 0;`
`@@ -36,20 +36,20 @@ uint32_t random_uint32(void)`
`36`	`36`
`37`	`37`	`uint64_t random_uint64(void)`
`38`	`38`	`{`
`39`		`- uint32_t r = 0;`
	`39`	`+ uint64_t r = 0;`
`40`	`40`	`for (int i = 0; i < 4; i++)`
`41`	`41`	`{`
`42`	`42`	`r = (r << 16) \| (rand() & 0xFFFF);`
`43`	`43`	`}`
`44`		`-`
	`44`	`+`
`45`	`45`	`return r;`
`46`	`46`	`}`
`47`	`47`
`48`	`48`	`__attribute__ ((noinline)) void generate_vector_32(Decimal32* buffer, size_t buffer_len)`
`49`	`49`	`{`
`50`	`50`	`for (size_t i = 0; i < buffer_len; ++i)`
`51`	`51`	`{`
`52`		`- buffer[i] = bid32_from_uint32(random_uint32() % 100);`
	`52`	`+ buffer[i] = bid32_from_uint32(random_uint32(), BID_ROUNDING_DOWN, &flag);`
`53`	`53`	`}`
`54`	`54`	`}`
`55`	`55`
`@@ -67,12 +67,12 @@ __attribute__ ((noinline)) void test_comparisons_32(Decimal32* data, const char*`
`67`	`67`	`Decimal32 val1 = data[k];`
`68`	`68`	`Decimal32 val2 = data[k + 1];`
`69`	`69`
`70`		`- s += (size_t)bid32_quiet_less(val1, val2);`
`71`		`- s += (size_t)bid32_quiet_less_equal(val1, val2);`
`72`		`- s += (size_t)bid32_quiet_greater(val1, val2);`
`73`		`- s += (size_t)bid32_quiet_greater_equal(val1, val2);`
`74`		`- s += (size_t)bid32_quiet_equal(val1, val2);`
`75`		`- s += (size_t)bid32_quiet_not_equal(val1, val2);`
	`70`	`+ s += (size_t)bid32_quiet_less(val1, val2, &flag);`
	`71`	`+ s += (size_t)bid32_quiet_less_equal(val1, val2, &flag);`
	`72`	`+ s += (size_t)bid32_quiet_greater(val1, val2, &flag);`
	`73`	`+ s += (size_t)bid32_quiet_greater_equal(val1, val2, &flag);`
	`74`	`+ s += (size_t)bid32_quiet_equal(val1, val2, &flag);`
	`75`	`+ s += (size_t)bid32_quiet_not_equal(val1, val2, &flag);`
`76`	`76`	`}`
`77`	`77`	`}`
`78`	`78`
`@@ -86,7 +86,7 @@ __attribute__ ((noinline)) void generate_vector_64(Decimal64* buffer, size_t buf`
`86`	`86`	`{`
`87`	`87`	`for (size_t i = 0; i < buffer_len; ++i)`
`88`	`88`	`{`
`89`		`- buffer[i] = bid64_from_uint64(random_uint64() % 10000);`
	`89`	`+ buffer[i] = bid64_from_uint64(random_uint64(), BID_ROUNDING_DOWN, &flag);`
`90`	`90`	`}`
`91`	`91`	`}`
`92`	`92`
`@@ -104,12 +104,12 @@ __attribute__ ((noinline)) void test_comparisons_64(Decimal64* data, const char*`
`104`	`104`	`Decimal64 val1 = data[k];`
`105`	`105`	`Decimal64 val2 = data[k + 1];`
`106`	`106`
`107`		`- s += (size_t)bid64_quiet_less(val1, val2);`
`108`		`- s += (size_t)bid64_quiet_less_equal(val1, val2);`
`109`		`- s += (size_t)bid64_quiet_greater(val1, val2);`
`110`		`- s += (size_t)bid64_quiet_greater_equal(val1, val2);`
`111`		`- s += (size_t)bid64_quiet_equal(val1, val2);`
`112`		`- s += (size_t)bid64_quiet_not_equal(val1, val2);`
	`107`	`+ s += (size_t)bid64_quiet_less(val1, val2, &flag);`
	`108`	`+ s += (size_t)bid64_quiet_less_equal(val1, val2, &flag);`
	`109`	`+ s += (size_t)bid64_quiet_greater(val1, val2, &flag);`
	`110`	`+ s += (size_t)bid64_quiet_greater_equal(val1, val2, &flag);`
	`111`	`+ s += (size_t)bid64_quiet_equal(val1, val2, &flag);`
	`112`	`+ s += (size_t)bid64_quiet_not_equal(val1, val2, &flag);`
`113`	`113`	`}`
`114`	`114`	`}`
`115`	`115`
`@@ -125,7 +125,7 @@ __attribute__ ((__noinline__)) void generate_vector_128(Decimal128* buffer, size`
`125`	`125`	`size_t i = 0;`
`126`	`126`	`while (i < buffer_len)`
`127`	`127`	`{`
`128`		`- buffer[i] = bid128_from_uint64(random_uint64() % 100);`
	`128`	`+ buffer[i] = bid128_from_uint64(random_uint64());`
`129`	`129`	`++i;`
`130`	`130`	`}`
`131`	`131`	`}`
`@@ -144,12 +144,12 @@ __attribute__ ((__noinline__)) void test_comparisons_128(Decimal128* data, const`
`144`	`144`	`Decimal128 val1 = data[k];`
`145`	`145`	`Decimal128 val2 = data[k + 1];`
`146`	`146`
`147`		`- s += (size_t)bid128_quiet_less(val1, val2);`
`148`		`- s += (size_t)bid128_quiet_less_equal(val1, val2);`
`149`		`- s += (size_t)bid128_quiet_greater(val1, val2);`
`150`		`- s += (size_t)bid128_quiet_greater_equal(val1, val2);`
`151`		`- s += (size_t)bid128_quiet_equal(val1, val2);`
`152`		`- s += (size_t)bid128_quiet_not_equal(val1, val2);`
	`147`	`+ s += (size_t)bid128_quiet_less(val1, val2, &flag);`
	`148`	`+ s += (size_t)bid128_quiet_less_equal(val1, val2, &flag);`
	`149`	`+ s += (size_t)bid128_quiet_greater(val1, val2, &flag);`
	`150`	`+ s += (size_t)bid128_quiet_greater_equal(val1, val2, &flag);`
	`151`	`+ s += (size_t)bid128_quiet_equal(val1, val2, &flag);`
	`152`	`+ s += (size_t)bid128_quiet_not_equal(val1, val2, &flag);`
`153`	`153`	`}`
`154`	`154`	`}`
`155`	`155`
`@@ -164,21 +164,21 @@ typedef Decimal32 (*operation_32)(Decimal32, Decimal32);`
`164`	`164`
`165`	`165`	`__attribute__ ((noinline)) Decimal32 add_32(Decimal32 a, Decimal32 b)`
`166`	`166`	`{`
`167`		`- return bid32_add(a, b);`
	`167`	`+ return bid32_add(a, b, BID_ROUNDING_DOWN, &flag);`
`168`	`168`	`}`
`169`	`169`	`__attribute__ ((noinline)) Decimal32 sub_32(Decimal32 a, Decimal32 b)`
`170`	`170`	`{`
`171`		`- return bid32_sub(a, b);`
	`171`	`+ return bid32_sub(a, b, BID_ROUNDING_DOWN, &flag);`
`172`	`172`	`}`
`173`	`173`
`174`	`174`	`__attribute__ ((noinline)) Decimal32 mul_32(Decimal32 a, Decimal32 b)`
`175`	`175`	`{`
`176`		`- return bid32_mul(a, b);`
	`176`	`+ return bid32_mul(a, b, BID_ROUNDING_DOWN, &flag);`
`177`	`177`	`}`
`178`	`178`
`179`	`179`	`__attribute__ ((noinline)) Decimal32 div_32(Decimal32 a, Decimal32 b)`
`180`	`180`	`{`
`181`		`- return bid32_div(a, b);`
	`181`	`+ return bid32_div(a, b, BID_ROUNDING_DOWN, &flag);`
`182`	`182`	`}`
`183`	`183`
`184`	`184`	`__attribute__ ((noinline)) void test_two_element_operation_32(Decimal32* data, operation_32 op, const char* label, const char* op_label)`
`@@ -195,7 +195,7 @@ __attribute__ ((noinline)) void test_two_element_operation_32(Decimal32* data, o`
`195`	`195`	`Decimal32 val1 = data[k];`
`196`	`196`	`Decimal32 val2 = data[k + 1];`
`197`	`197`
`198`		`- s += (size_t)bid32_to_int32_int(op(val1, val2));`
	`198`	`+ s += (size_t)bid32_to_int32_int(op(val1, val2), &flag);`
`199`	`199`	`}`
`200`	`200`	`}`
`201`	`201`
`@@ -209,22 +209,22 @@ typedef Decimal64 (*operation_64)(Decimal64, Decimal64);`
`209`	`209`
`210`	`210`	`__attribute__ ((noinline)) Decimal64 add_64(Decimal64 a, Decimal64 b)`
`211`	`211`	`{`
`212`		`- return bid64_add(a, b);`
	`212`	`+ return bid64_add(a, b, BID_ROUNDING_DOWN, &flag);`
`213`	`213`	`}`
`214`	`214`
`215`	`215`	`__attribute__ ((noinline)) Decimal64 sub_64(Decimal64 a, Decimal64 b)`
`216`	`216`	`{`
`217`		`- return bid64_sub(a, b);`
	`217`	`+ return bid64_sub(a, b, BID_ROUNDING_DOWN, &flag);`
`218`	`218`	`}`
`219`	`219`
`220`	`220`	`__attribute__ ((noinline)) Decimal64 mul_64(Decimal64 a, Decimal64 b)`
`221`	`221`	`{`
`222`		`- return bid64_mul(a, b);`
	`222`	`+ return bid64_mul(a, b, BID_ROUNDING_DOWN, &flag);`
`223`	`223`	`}`
`224`	`224`
`225`	`225`	`__attribute__ ((noinline)) Decimal64 div_64(Decimal64 a, Decimal64 b)`
`226`	`226`	`{`
`227`		`- return bid64_div(a, b);`
	`227`	`+ return bid64_div(a, b, BID_ROUNDING_DOWN, &flag);`
`228`	`228`	`}`
`229`	`229`
`230`	`230`	`__attribute__ ((noinline)) void test_two_element_operation_64(Decimal64* data, operation_64 op, const char* label, const char* op_label)`
`@@ -241,7 +241,7 @@ __attribute__ ((noinline)) void test_two_element_operation_64(Decimal64* data, o`
`241`	`241`	`Decimal64 val1 = data[k];`
`242`	`242`	`Decimal64 val2 = data[k + 1];`
`243`	`243`
`244`		`- s += (size_t)bid64_to_int64_int(op(val1, val2));`
	`244`	`+ s += (size_t)bid64_to_int64_int(op(val1, val2), &flag);`
`245`	`245`	`}`
`246`	`246`	`}`
`247`	`247`
`@@ -256,22 +256,22 @@ typedef Decimal128 (*operation_128)(Decimal128, Decimal128);`
`256`	`256`
`257`	`257`	`__attribute__ ((__noinline__)) Decimal128 add_128(Decimal128 a, Decimal128 b)`
`258`	`258`	`{`
`259`		`- return bid128_add(a, b);`
	`259`	`+ return bid128_add(a, b, BID_ROUNDING_DOWN, &flag);`
`260`	`260`	`}`
`261`	`261`
`262`	`262`	`__attribute__ ((__noinline__)) Decimal128 sub_128(Decimal128 a, Decimal128 b)`
`263`	`263`	`{`
`264`		`- return bid128_sub(a, b);`
	`264`	`+ return bid128_sub(a, b, BID_ROUNDING_DOWN, &flag);`
`265`	`265`	`}`
`266`	`266`
`267`	`267`	`__attribute__ ((__noinline__)) Decimal128 mul_128(Decimal128 a, Decimal128 b)`
`268`	`268`	`{`
`269`		`- return bid128_mul(a, b);`
	`269`	`+ return bid128_mul(a, b, BID_ROUNDING_DOWN, &flag);`
`270`	`270`	`}`
`271`	`271`
`272`	`272`	`__attribute__ ((__noinline__)) Decimal128 div_128(Decimal128 a, Decimal128 b)`
`273`	`273`	`{`
`274`		`- return bid128_div(a, b);`
	`274`	`+ return bid128_div(a, b, BID_ROUNDING_DOWN, &flag);`
`275`	`275`	`}`
`276`	`276`
`277`	`277`	`__attribute__ ((__noinline__)) void test_two_element_operation_128(Decimal128* data, operation_128 op, const char* label, const char* op_label)`
`@@ -288,7 +288,7 @@ __attribute__ ((__noinline__)) void test_two_element_operation_128(Decimal128* d`
`288`	`288`	`Decimal128 val1 = data[k];`
`289`	`289`	`Decimal128 val2 = data[k + 1];`
`290`	`290`
`291`		`- s += (size_t)bid128_to_int64_int(op(val1, val2));`
	`291`	`+ s += (size_t)bid128_to_int64_int(op(val1, val2), &flag);`
`292`	`292`	`}`
`293`	`293`	`}`
`294`	`294`