Fix casts, add tests

calebzulawski · calebzulawski · commit 3d8721b053ce · 2020-10-11T14:32:46.000-04:00
diff --git a/crates/core_simd/src/intrinsics.rs b/crates/core_simd/src/intrinsics.rs
@@ -36,4 +36,7 @@ extern "platform-intrinsic" {
 
     /// xor
     pub(crate) fn simd_xor<T>(x: T, y: T) -> T;
+
+    /// fptoui/fptosi/uitofp/sitofp
+    pub(crate) fn simd_cast<T, U>(x: T) -> U;
 }
diff --git a/crates/core_simd/src/round.rs b/crates/core_simd/src/round.rs
@@ -6,7 +6,6 @@ macro_rules! implement {
             ceil = $ceil_intrinsic:literal,
             round = $round_intrinsic:literal,
             trunc = $trunc_intrinsic:literal,
-            round_to_int = $round_to_int_intrinsic:literal,
         }
     } => {
         mod $type {
@@ -20,8 +19,6 @@ macro_rules! implement {
                 fn round_intrinsic(x: crate::$type) -> crate::$type;
                 #[link_name = $trunc_intrinsic]
                 fn trunc_intrinsic(x: crate::$type) -> crate::$type;
-                #[link_name = $round_to_int_intrinsic]
-                fn round_to_int_intrinsic(x: crate::$type) -> crate::$int_type;
             }
 
             impl crate::$type {
@@ -60,11 +57,24 @@ macro_rules! implement {
                     self - self.trunc()
                 }
 
+                /// Converts every lane to the integer type of the same width, discarding the
+                /// fractional part (rounding toward zero) without performing any range checks.
+                ///
+                /// # Safety
+                /// Every lane of `self` must satisfy all of the following:
+                ///
+                /// * It is not NaN
+                /// * It is not infinite
+                /// * Its value, once the fractional part is dropped, fits in the return lane type
+                #[inline]
+                pub unsafe fn to_int_unchecked(self) -> crate::$int_type {
+                    crate::intrinsics::simd_cast::<Self, crate::$int_type>(self)
+                }
+
                 /// Returns the nearest integer to each lane. Round half-way cases away from 0.0.
-                #[must_use = "method returns a new vector and does not mutate the original value"]
                 #[inline]
-                pub fn round_to_int(self) -> crate::$int_type {
-                    unsafe { round_to_int_intrinsic(self) }
+                pub fn round_from_int(value: crate::$int_type) -> Self {
+                    unsafe { crate::intrinsics::simd_cast(value) }
                 }
             }
         }
@@ -78,7 +88,6 @@ implement! {
         ceil = "llvm.ceil.v2f32",
         round = "llvm.round.v2f32",
         trunc = "llvm.trunc.v2f32",
-        round_to_int = "llvm.lround.i32.v2f32",
     }
 }
 
@@ -89,7 +98,6 @@ implement! {
         ceil = "llvm.ceil.v4f32",
         round = "llvm.round.v4f32",
         trunc = "llvm.trunc.v4f32",
-        round_to_int = "llvm.lround.i32.v4f32",
     }
 }
 
@@ -100,7 +108,6 @@ implement! {
         ceil = "llvm.ceil.v8f32",
         round = "llvm.round.v8f32",
         trunc = "llvm.trunc.v8f32",
-        round_to_int = "llvm.lround.i32.v8f32",
     }
 }
 
@@ -111,7 +118,6 @@ implement! {
         ceil = "llvm.ceil.v16f32",
         round = "llvm.round.v16f32",
         trunc = "llvm.trunc.v16f32",
-        round_to_int = "llvm.lround.i32.v16f32",
     }
 }
 
@@ -122,7 +128,6 @@ implement! {
         ceil = "llvm.ceil.v2f64",
         round = "llvm.round.v2f64",
         trunc = "llvm.trunc.v2f64",
-        round_to_int = "llvm.lround.i64.v2f64",
     }
 }
 
@@ -133,7 +138,6 @@ implement! {
         ceil = "llvm.ceil.v4f64",
         round = "llvm.round.v4f64",
         trunc = "llvm.trunc.v4f64",
-        round_to_int = "llvm.lround.i64.v4f64",
     }
 }
 
@@ -144,6 +148,5 @@ implement! {
         ceil = "llvm.ceil.v8f64",
         round = "llvm.round.v8f64",
         trunc = "llvm.trunc.v8f64",
-        round_to_int = "llvm.lround.i64.v8f64",
     }
 }
diff --git a/crates/core_simd/tests/helpers/lanewise.rs b/crates/core_simd/tests/helpers/lanewise.rs
@@ -1,8 +1,20 @@
-pub fn apply_unary_lanewise<T: Copy, V: AsMut<[T]> + Default>(mut x: V, f: impl Fn(T) -> T) -> V {
-    for lane in x.as_mut() {
-        *lane = f(*lane)
+/// Builds a `V2` by applying `f` to every lane of `x`.
+///
+/// The output starts out as `V2::default()`; each of its lanes is then overwritten with the
+/// result of `f` on the lane at the same position in `x`.
+///
+/// # Panics
+/// Panics if `x` and `V2::default()` do not expose the same number of lanes.
+pub fn apply_unary_lanewise<T1: Copy, T2: Copy, V1: AsRef<[T1]>, V2: AsMut<[T2]> + Default>(
+    x: V1,
+    f: impl Fn(T1) -> T2,
+) -> V2 {
+    let mut output = V2::default();
+    assert_eq!(x.as_ref().len(), output.as_mut().len());
+    for (dst, src) in output.as_mut().iter_mut().zip(x.as_ref()) {
+        *dst = f(*src);
     }
-    x
+    output
 }
 
 pub fn apply_binary_lanewise<T: Copy, V: AsRef<[T]> + AsMut<[T]> + Default>(
diff --git a/crates/core_simd/tests/ops_impl/f32.rs b/crates/core_simd/tests/ops_impl/f32.rs
@@ -1,6 +1,6 @@
 use super::helpers;
 
-float_tests! { f32x2, f32 }
-float_tests! { f32x4, f32 }
-float_tests! { f32x8, f32 }
-float_tests! { f32x16, f32 }
+float_tests! { f32x2, f32, i32x2, i32 }
+float_tests! { f32x4, f32, i32x4, i32 }
+float_tests! { f32x8, f32, i32x8, i32 }
+float_tests! { f32x16, f32, i32x16, i32 }
diff --git a/crates/core_simd/tests/ops_impl/f64.rs b/crates/core_simd/tests/ops_impl/f64.rs
@@ -1,5 +1,5 @@
 use super::helpers;
 
-float_tests! { f64x2, f64 }
-float_tests! { f64x4, f64 }
-float_tests! { f64x8, f64 }
+float_tests! { f64x2, f64, i64x2, i64 }
+float_tests! { f64x4, f64, i64x4, i64 }
+float_tests! { f64x8, f64, i64x8, i64 }
diff --git a/crates/core_simd/tests/ops_impl/float_macros.rs b/crates/core_simd/tests/ops_impl/float_macros.rs
@@ -1,5 +1,5 @@
 macro_rules! float_tests {
-    { $vector:ident, $scalar:ident } => {
+    { $vector:ident, $scalar:ident, $int_vector:ident, $int_scalar:ident } => {
         #[cfg(test)]
         mod $vector {
             use super::*;
@@ -24,6 +24,18 @@ macro_rules! float_tests {
                 slice.chunks_exact(lanes).map(from_slice)
             }
 
+            fn from_slice_int(slice: &[$int_scalar]) -> core_simd::$int_vector {
+                let mut value = core_simd::$int_vector::default();
+                let value_slice: &mut [_] = value.as_mut();
+                value_slice.copy_from_slice(&slice[0..value_slice.len()]);
+                value
+            }
+
+            fn slice_chunks_int(slice: &[$int_scalar]) -> impl Iterator<Item = core_simd::$int_vector> + '_ {
+                let lanes = core::mem::size_of::<core_simd::$int_vector>() / core::mem::size_of::<$int_scalar>();
+                slice.chunks_exact(lanes).map(from_slice_int)
+            }
+
             const A: [$scalar; 16] = [0.,   1.,  2.,  3.,  4.,  5.,  6.,  7.,  8.,  9., 10., 11., 12., 13., 14., 15.];
             const B: [$scalar; 16] = [16., 17., 18., 19., 20., 21., 22., 23., 24., 25., 26., 27., 28., 29., 30., 31.];
             const C: [$scalar; 16] = [
@@ -322,6 +334,107 @@ macro_rules! float_tests {
                     assert_biteq!(v.abs(), expected);
                 }
             }
+
+            #[test]
+            #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
+            fn ceil_odd_floats() {
+                for v in slice_chunks(&C) {
+                    let expected = apply_unary_lanewise(v, <$scalar>::ceil);
+                    assert_biteq!(v.ceil(), expected);
+                }
+            }
+
+            #[test]
+            #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
+            fn floor_odd_floats() {
+                for v in slice_chunks(&C) {
+                    let expected = apply_unary_lanewise(v, <$scalar>::floor);
+                    assert_biteq!(v.floor(), expected);
+                }
+            }
+
+            #[test]
+            #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
+            fn round_odd_floats() {
+                for v in slice_chunks(&C) {
+                    let expected = apply_unary_lanewise(v, <$scalar>::round);
+                    assert_biteq!(v.round(), expected);
+                }
+            }
+
+            #[test]
+            #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
+            fn trunc_odd_floats() {
+                for v in slice_chunks(&C) {
+                    let expected = apply_unary_lanewise(v, <$scalar>::trunc);
+                    assert_biteq!(v.trunc(), expected);
+                }
+            }
+
+            #[test]
+            #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
+            fn fract_odd_floats() {
+                for v in slice_chunks(&C) {
+                    let expected = apply_unary_lanewise(v, <$scalar>::fract);
+                    assert_biteq!(v.fract(), expected);
+                }
+            }
+
+            #[test]
+            #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
+            fn to_int_unchecked() {
+                // All inputs must fit the integer lane type: out-of-range values are UB here.
+                const VALUES: [$scalar; 16] = [
+                    -0.0,
+                    0.0,
+                    -1.0,
+                    1.0,
+                    16_777_215.0, // 2^24 - 1: exactly representable in both f32 and f64
+                    -16_777_215.0,
+                    <$scalar>::MIN_POSITIVE,
+                    -<$scalar>::MIN_POSITIVE,
+                    <$scalar>::EPSILON,
+                    -<$scalar>::EPSILON,
+                    core::$scalar::consts::PI,
+                    -core::$scalar::consts::PI,
+                    core::$scalar::consts::TAU,
+                    -core::$scalar::consts::TAU,
+                    100.0 / 3.0,
+                    -100.0 / 3.0,
+                ];
+                for v in slice_chunks(&VALUES) {
+                    let expected = apply_unary_lanewise(v, |x| unsafe { x.to_int_unchecked() });
+                    assert_biteq!(unsafe { v.to_int_unchecked() }, expected);
+                }
+            }
+
+            #[test]
+            #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
+            fn round_from_int() {
+                const VALUES: [$int_scalar; 16] = [
+                    0,
+                    0,
+                    1,
+                    -1,
+                    100,
+                    -100,
+                    200,
+                    -200,
+                    413,
+                    -413,
+                    1017,
+                    -1017,
+                    1234567,
+                    -1234567,
+                    <$int_scalar>::MAX,
+                    <$int_scalar>::MIN,
+                ];
+
+                for v in slice_chunks_int(&VALUES) {
+                    let expected = apply_unary_lanewise(v, |x| x as $scalar);
+                    assert_biteq!(core_simd::$vector::round_from_int(v), expected);
+                }
+            }
         }
     }
 }

Original file line number	Diff line number	Diff line change
`@@ -36,4 +36,7 @@ extern "platform-intrinsic" {`
`36`	`36`
`37`	`37`	`/// xor`
`38`	`38`	`pub(crate) fn simd_xor<T>(x: T, y: T) -> T;`
	`39`	`+`
	`40`	`+ /// fptoui/fptosi/uitofp/sitofp`
	`41`	`+ pub(crate) fn simd_cast<T, U>(x: T) -> U;`
`39`	`42`	`}`
Original file line number	Diff line number	Diff line change
`@@ -6,7 +6,6 @@ macro_rules! implement {`
`6`	`6`	`ceil = $ceil_intrinsic:literal,`
`7`	`7`	`round = $round_intrinsic:literal,`
`8`	`8`	`trunc = $trunc_intrinsic:literal,`
`9`		`- round_to_int = $round_to_int_intrinsic:literal,`
`10`	`9`	`}`
`11`	`10`	`} => {`
`12`	`11`	`mod $type {`
`@@ -20,8 +19,6 @@ macro_rules! implement {`
`20`	`19`	`fn round_intrinsic(x: crate::$type) -> crate::$type;`
`21`	`20`	`#[link_name = $trunc_intrinsic]`
`22`	`21`	`fn trunc_intrinsic(x: crate::$type) -> crate::$type;`
`23`		`- #[link_name = $round_to_int_intrinsic]`
`24`		`- fn round_to_int_intrinsic(x: crate::$type) -> crate::$int_type;`
`25`	`22`	`}`
`26`	`23`
`27`	`24`	`impl crate::$type {`
`@@ -60,11 +57,24 @@ macro_rules! implement {`
`60`	`57`	`self - self.trunc()`
`61`	`58`	`}`
`62`	`59`
	`60`	`+ /// Rounds toward zero and converts to the same-width integer type, assuming that`
	`61`	`+ /// the value is finite and fits in that type.`
	`62`	`+ ///`
	`63`	`+ /// # Safety`
	`64`	`+ /// The value must:`
	`65`	`+ ///`
	`66`	`+ /// * Not be NaN`
	`67`	`+ /// * Not be infinite`
	`68`	`+ /// * Be representable in the return type, after truncating off its fractional part`
	`69`	`+ #[inline]`
	`70`	`+ pub unsafe fn to_int_unchecked(self) -> crate::$int_type {`
	`71`	`+ crate::intrinsics::simd_cast(self)`
	`72`	`+ }`
	`73`	`+`
`63`	`74`	`/// Returns the nearest integer to each lane. Round half-way cases away from 0.0.`
`64`		`- #[must_use = "method returns a new vector and does not mutate the original value"]`
`65`	`75`	`#[inline]`
`66`		`- pub fn round_to_int(self) -> crate::$int_type {`
`67`		`- unsafe { round_to_int_intrinsic(self) }`
	`76`	`+ pub fn round_from_int(value: crate::$int_type) -> Self {`
	`77`	`+ unsafe { crate::intrinsics::simd_cast(value) }`
`68`	`78`	`}`
`69`	`79`	`}`
`70`	`80`	`}`
`@@ -78,7 +88,6 @@ implement! {`
`78`	`88`	`ceil = "llvm.ceil.v2f32",`
`79`	`89`	`round = "llvm.round.v2f32",`
`80`	`90`	`trunc = "llvm.trunc.v2f32",`
`81`		`- round_to_int = "llvm.lround.i32.v2f32",`
`82`	`91`	`}`
`83`	`92`	`}`
`84`	`93`
`@@ -89,7 +98,6 @@ implement! {`
`89`	`98`	`ceil = "llvm.ceil.v4f32",`
`90`	`99`	`round = "llvm.round.v4f32",`
`91`	`100`	`trunc = "llvm.trunc.v4f32",`
`92`		`- round_to_int = "llvm.lround.i32.v4f32",`
`93`	`101`	`}`
`94`	`102`	`}`
`95`	`103`
`@@ -100,7 +108,6 @@ implement! {`
`100`	`108`	`ceil = "llvm.ceil.v8f32",`
`101`	`109`	`round = "llvm.round.v8f32",`
`102`	`110`	`trunc = "llvm.trunc.v8f32",`
`103`		`- round_to_int = "llvm.lround.i32.v8f32",`
`104`	`111`	`}`
`105`	`112`	`}`
`106`	`113`
`@@ -111,7 +118,6 @@ implement! {`
`111`	`118`	`ceil = "llvm.ceil.v16f32",`
`112`	`119`	`round = "llvm.round.v16f32",`
`113`	`120`	`trunc = "llvm.trunc.v16f32",`
`114`		`- round_to_int = "llvm.lround.i32.v16f32",`
`115`	`121`	`}`
`116`	`122`	`}`
`117`	`123`
`@@ -122,7 +128,6 @@ implement! {`
`122`	`128`	`ceil = "llvm.ceil.v2f64",`
`123`	`129`	`round = "llvm.round.v2f64",`
`124`	`130`	`trunc = "llvm.trunc.v2f64",`
`125`		`- round_to_int = "llvm.lround.i64.v2f64",`
`126`	`131`	`}`
`127`	`132`	`}`
`128`	`133`
`@@ -133,7 +138,6 @@ implement! {`
`133`	`138`	`ceil = "llvm.ceil.v4f64",`
`134`	`139`	`round = "llvm.round.v4f64",`
`135`	`140`	`trunc = "llvm.trunc.v4f64",`
`136`		`- round_to_int = "llvm.lround.i64.v4f64",`
`137`	`141`	`}`
`138`	`142`	`}`
`139`	`143`
`@@ -144,6 +148,5 @@ implement! {`
`144`	`148`	`ceil = "llvm.ceil.v8f64",`
`145`	`149`	`round = "llvm.round.v8f64",`
`146`	`150`	`trunc = "llvm.trunc.v8f64",`
`147`		`- round_to_int = "llvm.lround.i64.v8f64",`
`148`	`151`	`}`
`149`	`152`	`}`