format

karthikbhargavan · karthikbhargavan · commit 2bba06951d92 · 2025-07-31T01:46:01.000-04:00
diff --git a/testable-simd-models/src/core_arch/x86/models/avx.rs b/testable-simd-models/src/core_arch/x86/models/avx.rs
@@ -779,8 +779,14 @@ pub fn _mm_permute_ps<const IMM8: i32>(a: __m128) -> __m128 {
     static_assert_uimm_bits!(IMM8, 8);
     {
         transmute(simd_shuffle(
-            a.as_f32x4(), _mm_undefined_ps().as_f32x4(), [(IMM8 as u32 >> 0) & 0b11, (IMM8 as u32 >> 2) & 0b11,
-            (IMM8 as u32 >> 4) & 0b11, (IMM8 as u32 >> 6) & 0b11,],
+            a.as_f32x4(),
+            _mm_undefined_ps().as_f32x4(),
+            [
+                (IMM8 as u32 >> 0) & 0b11,
+                (IMM8 as u32 >> 2) & 0b11,
+                (IMM8 as u32 >> 4) & 0b11,
+                (IMM8 as u32 >> 6) & 0b11,
+            ],
         ))
     }
 }
@@ -887,7 +893,13 @@ pub fn _mm256_broadcast_ss(f: &f32) -> __m256 {
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.htmlext=_mm256_broadcast_ps)
 pub fn _mm256_broadcast_ps(a: &__m128) -> __m256 {
-    { transmute(simd_shuffle((*a).as_f32x4(), _mm_setzero_ps().as_f32x4(), [0, 1, 2, 3, 0, 1, 2, 3])) }
+    {
+        transmute(simd_shuffle(
+            (*a).as_f32x4(),
+            _mm_setzero_ps().as_f32x4(),
+            [0, 1, 2, 3, 0, 1, 2, 3],
+        ))
+    }
 }
 /// Broadcasts 128 bits from memory (composed of 2 packed double-precision
 /// (64-bit) floating-point elements) to all elements of the returned vector.
@@ -909,8 +921,9 @@ pub fn _mm256_insertf128_ps<const IMM1: i32>(a: __m256, b: __m128) -> __m256 {
     static_assert_uimm_bits!(IMM1, 1);
     {
         transmute(simd_shuffle(
-            a.as_f32x8(), _mm256_castps128_ps256(b).as_f32x8(), [[8, 9, 10, 11, 4, 5, 6, 7], [0, 1, 2, 3, 8, 9,
-            10, 11]] [IMM1 as usize],
+            a.as_f32x8(),
+            _mm256_castps128_ps256(b).as_f32x8(),
+            [[8, 9, 10, 11, 4, 5, 6, 7], [0, 1, 2, 3, 8, 9, 10, 11]][IMM1 as usize],
         ))
     }
 }
@@ -923,8 +936,9 @@ pub fn _mm256_insertf128_pd<const IMM1: i32>(a: __m256d, b: __m128d) -> __m256d
     static_assert_uimm_bits!(IMM1, 1);
     {
         transmute(simd_shuffle(
-            a.as_f64x4(), _mm256_castpd128_pd256(b).as_f64x4(), 
-            [[4, 5, 2, 3], [0, 1, 4, 5]] [IMM1 as usize],
+            a.as_f64x4(),
+            _mm256_castpd128_pd256(b).as_f64x4(),
+            [[4, 5, 2, 3], [0, 1, 4, 5]][IMM1 as usize],
         ))
     }
 }
@@ -1599,7 +1613,13 @@ pub fn _mm256_castsi256_si128(a: __m256i) -> __m128i {
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.htmlext=_mm256_castps128_ps256)
 pub fn _mm256_castps128_ps256(a: __m128) -> __m256 {
-    { transmute(simd_shuffle(a.as_f32x4(), _mm_undefined_ps().as_f32x4(), [0, 1, 2, 3, 4, 4, 4, 4])) }
+    {
+        transmute(simd_shuffle(
+            a.as_f32x4(),
+            _mm_undefined_ps().as_f32x4(),
+            [0, 1, 2, 3, 4, 4, 4, 4],
+        ))
+    }
 }
 /// Casts vector of type __m128d to type __m256d;
 /// the upper 128 bits of the result are undefined.
@@ -1630,7 +1650,13 @@ pub fn _mm256_castsi128_si256(a: __m128i) -> __m256i {
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.htmlext=_mm256_zextps128_ps256)
 pub fn _mm256_zextps128_ps256(a: __m128) -> __m256 {
-    { transmute(simd_shuffle(a.as_f32x4(), _mm_setzero_ps().as_f32x4(), [0, 1, 2, 3, 4, 5, 6, 7])) }
+    {
+        transmute(simd_shuffle(
+            a.as_f32x4(),
+            _mm_setzero_ps().as_f32x4(),
+            [0, 1, 2, 3, 4, 5, 6, 7],
+        ))
+    }
 }
 /// Constructs a 256-bit integer vector from a 128-bit integer vector.
 /// The lower 128 bits contain the value of the source vector. The upper
@@ -1652,7 +1678,13 @@ pub fn _mm256_zextsi128_si256(a: __m128i) -> __m256i {
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.htmlext=_mm256_zextpd128_pd256)
 // NOTE: Not modeled yet
 pub fn _mm256_zextpd128_pd256(a: __m128d) -> __m256d {
-    { transmute(simd_shuffle(a.as_f64x2(), _mm_setzero_pd().as_f64x2(), [0, 1, 2, 3])) }
+    {
+        transmute(simd_shuffle(
+            a.as_f64x2(),
+            _mm_setzero_pd().as_f64x2(),
+            [0, 1, 2, 3],
+        ))
+    }
 }
 /// Returns vector of type `__m256` with indeterminate elements.
 /// Despite using the word "undefined" (following Intel's naming scheme), this non-deterministically
diff --git a/testable-simd-models/src/core_arch/x86/models/avx2.rs b/testable-simd-models/src/core_arch/x86/models/avx2.rs
@@ -22,10 +22,10 @@
 use crate::abstractions::simd::*;
 use crate::abstractions::utilities::*;
 
-use super::sse::*;
-use super::sse2::*;
 use super::avx::*;
 use super::avx2_handwritten::*;
+use super::sse::*;
+use super::sse2::*;
 use super::types::*;
 
 /// Computes the absolute values of packed 32-bit integers in `a`.
@@ -389,14 +389,26 @@ pub fn _mm256_broadcastq_epi64(a: __m128i) -> __m256i {
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.html#text=_mm_broadcastsd_pd)
 pub fn _mm_broadcastsd_pd(a: __m128d) -> __m128d {
-    { transmute(simd_shuffle(a.as_f64x2(), _mm_setzero_pd().as_f64x2(), [0_u32; 2])) }
+    {
+        transmute(simd_shuffle(
+            a.as_f64x2(),
+            _mm_setzero_pd().as_f64x2(),
+            [0_u32; 2],
+        ))
+    }
 }
 /// Broadcasts the low double-precision (64-bit) floating-point element
 /// from `a` to all elements of the 256-bit returned value.
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.html#text=_mm256_broadcastsd_pd)
 pub fn _mm256_broadcastsd_pd(a: __m128d) -> __m256d {
-    { transmute(simd_shuffle(a.as_f64x2(), _mm_setzero_pd().as_f64x2(), [0_u32; 4])) }
+    {
+        transmute(simd_shuffle(
+            a.as_f64x2(),
+            _mm_setzero_pd().as_f64x2(),
+            [0_u32; 4],
+        ))
+    }
 }
 /// Broadcasts 128 bits of integer data from a to all 128-bit lanes in
 /// the 256-bit returned value.
@@ -423,14 +435,26 @@ pub fn _mm256_broadcastsi128_si256(a: __m128i) -> __m256i {
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.html#text=_mm_broadcastss_ps)
 pub fn _mm_broadcastss_ps(a: __m128) -> __m128 {
-    { transmute(simd_shuffle(a.as_f32x4(), _mm_setzero_ps().as_f32x4(), [0_u32; 4])) }
+    {
+        transmute(simd_shuffle(
+            a.as_f32x4(),
+            _mm_setzero_ps().as_f32x4(),
+            [0_u32; 4],
+        ))
+    }
 }
 /// Broadcasts the low single-precision (32-bit) floating-point element
 /// from `a` to all elements of the 256-bit returned value.
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.html#text=_mm256_broadcastss_ps)
 pub fn _mm256_broadcastss_ps(a: __m128) -> __m256 {
-    { transmute(simd_shuffle(a.as_f32x4(), _mm_setzero_ps().as_f32x4(), [0_u32; 8])) }
+    {
+        transmute(simd_shuffle(
+            a.as_f32x4(),
+            _mm_setzero_ps().as_f32x4(),
+            [0_u32; 8],
+        ))
+    }
 }
 /// Broadcasts the low packed 16-bit integer from a to all elements of
 /// the 128-bit returned value
diff --git a/testable-simd-models/src/core_arch/x86/models/mod.rs b/testable-simd-models/src/core_arch/x86/models/mod.rs
@@ -20,11 +20,11 @@
 //! In general, it is best to gain an idea of how an implementation should be written by looking
 //! at how other functions are implemented. Also see `core::arch::x86` for [reference](https://github.com/rust-lang/stdarch/tree/master/crates/core_arch).
 
-pub mod sse;
 pub mod avx;
 pub mod avx2;
 pub mod avx2_handwritten;
 pub mod avx_handwritten;
+pub mod sse;
 pub mod sse2;
 pub mod sse2_handwritten;
 pub mod ssse3;
diff --git a/testable-simd-models/src/core_arch/x86/models/sse.rs b/testable-simd-models/src/core_arch/x86/models/sse.rs
@@ -1,7 +1,7 @@
 //! Streaming SIMD Extensions (SSE)
+use super::types::*;
 use crate::abstractions::simd::*;
 use crate::abstractions::utilities::*;
-use super::types::*;
 
 /// Returns vector of type __m128 with indeterminate elements.with indetermination elements.
 /// Despite using the word "undefined" (following Intel's naming scheme), this non-deterministically
@@ -10,11 +10,12 @@ use super::types::*;
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.html#text=_mm_undefined_ps)
 pub fn _mm_undefined_ps() -> __m128 {
-    transmute(f32x4::ZERO()) 
+    transmute(f32x4::ZERO())
 }
 
 /// Construct a `__m128` with all elements initialized to zero.
 ///
 /// [Intel's documentation](https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.html#text=_mm_setzero_ps)
 pub fn _mm_setzero_ps() -> __m128 {
-    transmute(f32x4::ZERO()) }
+    transmute(f32x4::ZERO())
+}