Extended bruteforce test.

Dawoodoz · Dawoodoz · commit 5cbdb5243fe2 · 2026-02-15T12:06:17.000+01:00
diff --git a/Source/test/tests/BruteSimdTest.cpp b/Source/test/tests/BruteSimdTest.cpp
@@ -4,6 +4,8 @@
 #include "../../DFPSR/base/TemporaryCallback.h"
 #include "../../DFPSR/api/randomAPI.h"
 
+// These tests check for consistency across implementations, instead of giving examples of expected outcome.
+
 static const intptr_t ITERATIONS = 1000000;
 
 template<typename T>
@@ -119,8 +121,64 @@ void binaryEquivalent (
 	printText(U"*");
 }
 
-#define UNARY_POINT_EQUIVALENCE(S, V, EXPR) unaryEquivalent<S, S, V, V>([](const S &a) -> S { return EXPR; }, [](const V &a) -> V { return EXPR; }, U"unary function equivalence test between " U###S U" and " U###V U" for " U###EXPR)
-#define BINARY_POINT_EQUIVALENCE(S, V, EXPR) binaryEquivalent<S, S, V, V>([](const S &a, const S &b) -> S { return EXPR; }, [](const V &a, const V &b) -> V { return EXPR; }, U"binary function equivalence test between " U###S U" and " U###V U" for " U###EXPR)
+// Compares a three-argument scalar operation against its SIMD counterpart, lane by lane over random inputs. TODO: Is it time to use varargs instead of copying this?
+template<typename S_IN, typename S_OUT, typename V_IN, typename V_OUT>
+void trinaryEquivalent (
+  const TemporaryCallback<S_OUT(const S_IN &a, const S_IN &b, const S_IN &c)> &scalarOp,
+  const TemporaryCallback<V_OUT(const V_IN &a, const V_IN &b, const V_IN &c)> &simdOp,
+  const ReadableString &testName
+) {
+	constexpr intptr_t laneCount = (sizeof(V_IN) / sizeof(S_IN));
+	// This test only applies to functions where input and output has the same number of lanes.
+	ASSERT_EQUAL(laneCount, sizeof(V_OUT) / sizeof(S_OUT));
+	// Initialize a random generator independently of other bruteforce tests
+	//   so that disabling another test does not affect this test.
+	RandomGenerator generator = random_createGenerator(460983751);
+	// Loop over random inputs.
+	for (intptr_t iteration = 0; iteration < ITERATIONS; iteration++) {
+		// Generate random input, aligned by the size of V_IN because the arrays are loaded using V_IN::readAlignedUnsafe.
+		ALIGN_BYTES(sizeof(V_IN)) S_IN inputA[laneCount];
+		ALIGN_BYTES(sizeof(V_IN)) S_IN inputB[laneCount];
+		ALIGN_BYTES(sizeof(V_IN)) S_IN inputC[laneCount];
+		for (intptr_t lane = 0; lane < laneCount; lane++) {
+			inputA[lane] = generate<S_IN>(generator);
+			inputB[lane] = generate<S_IN>(generator);
+			inputC[lane] = generate<S_IN>(generator);
+		}
+		// Execute scalar operation for all lanes.
+		ALIGN_BYTES(sizeof(V_OUT)) S_OUT scalarResult[laneCount];
+		for (intptr_t lane = 0; lane < laneCount; lane++) {
+			scalarResult[lane] = scalarOp(inputA[lane], inputB[lane], inputC[lane]);
+		}
+		// Execute SIMD operation with all lanes at the same time.
+		V_IN simdInputA = V_IN::readAlignedUnsafe(inputA);
+		V_IN simdInputB = V_IN::readAlignedUnsafe(inputB);
+		V_IN simdInputC = V_IN::readAlignedUnsafe(inputC);
+		V_OUT simdOutput = simdOp(simdInputA, simdInputB, simdInputC);
+		ALIGN_BYTES(sizeof(V_OUT)) S_OUT vectorResult[laneCount];
+		simdOutput.writeAlignedUnsafe(vectorResult);
+		// Compare results and stop at the first mismatching lane.
+		for (intptr_t lane = 0; lane < laneCount; lane++) {
+			if (!somewhatEqual(scalarResult[lane], vectorResult[lane])) {
+				printText(U"\n_______________________________ FAIL _______________________________\n");
+				printText(U"\nWrong result at lane ", lane, U" of 0..", laneCount - 1, U" at iteration ", iteration, U" of ", testName, U"!\n");
+				printText(U"Input: ", inputA[lane], U", ", inputB[lane], U", ", inputC[lane], U"\n");
+				printText(U"Scalar result: ", scalarResult[lane], U"\n");
+				printText(U"Vector result: ", vectorResult[lane], U"\n");
+				printText(U"\n____________________________________________________________________\n");
+				failed = true;
+				return;
+			}
+		}
+	}
+	printText(U"*");
+}
+// The _EXPR macros evaluate the same expression text on lambda arguments named a (and b) for both the scalar type S and the vector type V, while the _FUNC macros pass all arguments to FUNC.
+#define   UNARY_POINT_EQUIVALENCE_EXPR(S, V, EXPR)   unaryEquivalent<S, S, V, V>([](const S &a)                         -> S { return EXPR;          }, [](const V &a)                         -> V { return EXPR;          }, U"unary function equivalence test between "  U###S U" and " U###V U" for " U###EXPR)
+#define  BINARY_POINT_EQUIVALENCE_EXPR(S, V, EXPR)  binaryEquivalent<S, S, V, V>([](const S &a, const S &b)             -> S { return EXPR;          }, [](const V &a, const V &b)             -> V { return EXPR;          }, U"binary function equivalence test between " U###S U" and " U###V U" for " U###EXPR)
+#define   UNARY_POINT_EQUIVALENCE_FUNC(S, V, FUNC)   unaryEquivalent<S, S, V, V>([](const S &a)                         -> S { return FUNC(a);       }, [](const V &a)                         -> V { return FUNC(a);       }, U"unary function equivalence test between "  U###S U" and " U###V U" for " U###FUNC)
+#define  BINARY_POINT_EQUIVALENCE_FUNC(S, V, FUNC)  binaryEquivalent<S, S, V, V>([](const S &a, const S &b)             -> S { return FUNC(a, b);    }, [](const V &a, const V &b)             -> V { return FUNC(a, b);    }, U"binary function equivalence test between " U###S U" and " U###V U" for " U###FUNC)
+#define TRINARY_POINT_EQUIVALENCE_FUNC(S, V, FUNC) trinaryEquivalent<S, S, V, V>([](const S &a, const S &b, const S &c) -> S { return FUNC(a, b, c); }, [](const V &a, const V &b, const V &c) -> V { return FUNC(a, b, c); }, U"trinary function equivalence test between " U###S U" and " U###V U" for " U###FUNC)
 
 START_TEST(BruteSimd)
 	printText(U"\nThe bruteforce SIMD test is compiled using:\n");
@@ -141,75 +199,154 @@ START_TEST(BruteSimd)
 	#endif
 
 	// Addition.
-	BINARY_POINT_EQUIVALENCE(uint8_t , U8x16 , a + b);
-	BINARY_POINT_EQUIVALENCE(uint8_t , U8x32 , a + b);
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x8 , a + b);
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x16, a + b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x4 , a + b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x8 , a + b);
-	BINARY_POINT_EQUIVALENCE(int32_t , I32x4 , a + b);
-	BINARY_POINT_EQUIVALENCE(int32_t , I32x8 , a + b);
-	BINARY_POINT_EQUIVALENCE(float   , F32x4 , a + b);
-	BINARY_POINT_EQUIVALENCE(float   , F32x8 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x16 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x32 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x8 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x16, a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x4 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x8 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x4 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x8 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(float   , F32x4 , a + b);
+	BINARY_POINT_EQUIVALENCE_EXPR(float   , F32x8 , a + b);
 
 	// Subtraction
-	BINARY_POINT_EQUIVALENCE(uint8_t , U8x16 , a - b);
-	BINARY_POINT_EQUIVALENCE(uint8_t , U8x32 , a - b);
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x8 , a - b);
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x16, a - b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x4 , a - b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x8 , a - b);
-	BINARY_POINT_EQUIVALENCE(int32_t , I32x4 , a - b);
-	BINARY_POINT_EQUIVALENCE(int32_t , I32x8 , a - b);
-	BINARY_POINT_EQUIVALENCE(float   , F32x4 , a - b);
-	BINARY_POINT_EQUIVALENCE(float   , F32x8 , a - b);
-
-	// Negation
-	UNARY_POINT_EQUIVALENCE(int32_t , I32x4 , -a);
-	UNARY_POINT_EQUIVALENCE(int32_t , I32x8 , -a);
-	UNARY_POINT_EQUIVALENCE(float   , F32x4 , -a);
-	UNARY_POINT_EQUIVALENCE(float   , F32x8 , -a);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x16 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x32 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x8 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x16, a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x4 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x8 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x4 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x8 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(float   , F32x4 , a - b);
+	BINARY_POINT_EQUIVALENCE_EXPR(float   , F32x8 , a - b);
+
+	// Negation (only applicable to signed types)
+	UNARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x4 , -a);
+	UNARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x8 , -a);
+	UNARY_POINT_EQUIVALENCE_EXPR(float   , F32x4 , -a);
+	UNARY_POINT_EQUIVALENCE_EXPR(float   , F32x8 , -a);
 
 	// Multiplication
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x16 , a * b); // Missing
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x32 , a * b); // Missing
-	//BINARY_POINT_EQUIVALENCE(uint16_t, U16x8 , a * b); // Missing
-	//BINARY_POINT_EQUIVALENCE(uint16_t, U16x16, a * b); // Missing
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x4 , a * b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x8 , a * b);
-	BINARY_POINT_EQUIVALENCE(int32_t , I32x4 , a * b);
-	BINARY_POINT_EQUIVALENCE(int32_t , I32x8 , a * b);
-	BINARY_POINT_EQUIVALENCE(float   , F32x4 , a * b);
-	BINARY_POINT_EQUIVALENCE(float   , F32x8 , a * b);
-
-	// Bitwise and
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x16 , a & b); // Missing
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x32 , a & b); // Missing
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x8 , a & b);
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x16, a & b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x4 , a & b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x8 , a & b);
-
-	// Bitwise or
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x16, a | b); // Missing
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x32, a | b); // Missing
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x8 , a | b);
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x16, a | b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x4 , a | b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x8 , a | b);
-
-	// Bitwise xor
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x16, a ^ b); // Missing
-	//BINARY_POINT_EQUIVALENCE(uint8_t , U8x32, a ^ b); // Missing
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x8 , a ^ b);
-	BINARY_POINT_EQUIVALENCE(uint16_t, U16x16, a ^ b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x4 , a ^ b);
-	BINARY_POINT_EQUIVALENCE(uint32_t, U32x8 , a ^ b);
-
-	// Bitwise negation
-	UNARY_POINT_EQUIVALENCE(uint16_t, U16x8 , ~a);
-	UNARY_POINT_EQUIVALENCE(uint16_t, U16x16, ~a);
-	UNARY_POINT_EQUIVALENCE(uint32_t, U32x4 , ~a);
-	UNARY_POINT_EQUIVALENCE(uint32_t, U32x8 , ~a);
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x16 , a * b); // Missing
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x32 , a * b); // Missing
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x8 , a * b); // Missing
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x16, a * b); // Missing
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x4 , a * b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x8 , a * b);
+	BINARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x4 , a * b);
+	BINARY_POINT_EQUIVALENCE_EXPR(int32_t , I32x8 , a * b);
+	BINARY_POINT_EQUIVALENCE_EXPR(float   , F32x4 , a * b);
+	BINARY_POINT_EQUIVALENCE_EXPR(float   , F32x8 , a * b);
+
+	// Bitwise and (only numerically well defined for unsigned integers)
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x16 , a & b); // Missing
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x32 , a & b); // Missing
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x8 , a & b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x16, a & b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x4 , a & b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x8 , a & b);
+
+	// Bitwise or (only numerically well defined for unsigned integers)
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x16, a | b); // Missing
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x32, a | b); // Missing
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x8 , a | b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x16, a | b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x4 , a | b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x8 , a | b);
+
+	// Bitwise xor (only numerically well defined for unsigned integers)
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x16, a ^ b); // Missing
+	//BINARY_POINT_EQUIVALENCE_EXPR(uint8_t , U8x32, a ^ b); // Missing
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x8 , a ^ b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x16, a ^ b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x4 , a ^ b);
+	BINARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x8 , a ^ b);
+
+	// Bitwise negation (only numerically well defined for unsigned integers)
+	UNARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x8 , ~a);
+	UNARY_POINT_EQUIVALENCE_EXPR(uint16_t, U16x16, ~a);
+	UNARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x4 , ~a);
+	UNARY_POINT_EQUIVALENCE_EXPR(uint32_t, U32x8 , ~a);
+
+	// Absolute (only applicable to signed types)
+	UNARY_POINT_EQUIVALENCE_FUNC(int32_t, I32x4, dsr::abs);
+	UNARY_POINT_EQUIVALENCE_FUNC(int32_t, I32x8, dsr::abs);
+	UNARY_POINT_EQUIVALENCE_FUNC(float  , F32x4, dsr::abs);
+	UNARY_POINT_EQUIVALENCE_FUNC(float  , F32x8, dsr::abs);
+
+	// Minimum
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x16 , dsr::min); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x32 , dsr::min); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x8 , dsr::min); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x16, dsr::min); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x4 , dsr::min); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x8 , dsr::min); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x4 , dsr::min); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x8 , dsr::min); // Missing
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::min);
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::min);
+
+	// Maximum
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x16 , dsr::max); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x32 , dsr::max); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x8 , dsr::max); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x16, dsr::max); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x4 , dsr::max); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x8 , dsr::max); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x4 , dsr::max); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x8 , dsr::max); // Missing
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::max);
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::max);
+
+	// Clamp using upper and lower limit
+	//TRINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x16 , dsr::clamp); // Missing
+	//TRINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x32 , dsr::clamp); // Missing
+	//TRINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x8 , dsr::clamp); // Missing
+	//TRINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x16, dsr::clamp); // Missing
+	//TRINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x4 , dsr::clamp); // Missing
+	//TRINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x8 , dsr::clamp); // Missing
+	//TRINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x4 , dsr::clamp); // Missing
+	//TRINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x8 , dsr::clamp); // Missing
+	TRINARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::clamp);
+	TRINARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::clamp);
+
+	// Clamp using only the upper limit (same as minimum but different name for readability)
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x16 , dsr::clampUpper); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x32 , dsr::clampUpper); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x8 , dsr::clampUpper); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x16, dsr::clampUpper); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x4 , dsr::clampUpper); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x8 , dsr::clampUpper); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x4 , dsr::clampUpper); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x8 , dsr::clampUpper); // Missing
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::clampUpper);
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::clampUpper);
+
+	// Clamp using only the lower limit (same as maximum but different name for readability)
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x16 , dsr::clampLower); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint8_t , U8x32 , dsr::clampLower); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x8 , dsr::clampLower); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint16_t, U16x16, dsr::clampLower); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x4 , dsr::clampLower); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(uint32_t, U32x8 , dsr::clampLower); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x4 , dsr::clampLower); // Missing
+	//BINARY_POINT_EQUIVALENCE_FUNC(int32_t , I32x8 , dsr::clampLower); // Missing
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::clampLower);
+	BINARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::clampLower);
+
+/* Needs a more flexible precision or input range to handle singularity near division by zero.
+	// Reciprocal (only applicable to floating-point types)
+	UNARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::reciprocal);
+	UNARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::reciprocal);
+
+	// Square root (only applicable to floating-point types)
+	UNARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::squareRoot);
+	UNARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::squareRoot);
 
+	// Reciprocal square root (only applicable to floating-point types)
+	UNARY_POINT_EQUIVALENCE_FUNC(float   , F32x4 , dsr::reciprocalSquareRoot);
+	UNARY_POINT_EQUIVALENCE_FUNC(float   , F32x8 , dsr::reciprocalSquareRoot);
+*/
 END_TEST