@@ -4022,7 +4022,7 @@ SZ_PUBLIC sz_u64_t sz_checksum_avx2(sz_cptr_t text, sz_size_t length) {
40224022 __m128i low_xmm = _mm256_castsi256_si128 (sums_vec.ymm );
40234023 __m128i high_xmm = _mm256_extracti128_si256 (sums_vec.ymm , 1 );
40244024 __m128i sums_xmm = _mm_add_epi64 (low_xmm, high_xmm);
4025- sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64x (sums_xmm);
4025+ sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64 (sums_xmm);
40264026 sz_u64_t high = (sz_u64_t )_mm_extract_epi64 (sums_xmm, 1 );
40274027 sz_u64_t result = low + high;
40284028 if (length) result += sz_checksum_serial (text, length);
@@ -4073,7 +4073,7 @@ SZ_PUBLIC sz_u64_t sz_checksum_avx2(sz_cptr_t text, sz_size_t length) {
40734073 __m128i low_xmm = _mm256_castsi256_si128 (sums_vec.ymm );
40744074 __m128i high_xmm = _mm256_extracti128_si256 (sums_vec.ymm , 1 );
40754075 __m128i sums_xmm = _mm_add_epi64 (low_xmm, high_xmm);
4076- sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64x (sums_xmm);
4076+ sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64 (sums_xmm);
40774077 sz_u64_t high = (sz_u64_t )_mm_extract_epi64 (sums_xmm, 1 );
40784078 result += low + high;
40794079 return result;
@@ -5306,7 +5306,7 @@ SZ_PUBLIC sz_u64_t sz_checksum_avx512(sz_cptr_t text, sz_size_t length) {
53065306 __mmask16 mask = _sz_u16_mask_until (length);
53075307 text_vec.xmms [0 ] = _mm_maskz_loadu_epi8 (mask, text);
53085308 sums_vec.xmms [0 ] = _mm_sad_epu8 (text_vec.xmms [0 ], _mm_setzero_si128 ());
5309- sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64x (sums_vec.xmms [0 ]);
5309+ sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64 (sums_vec.xmms [0 ]);
53105310 sz_u64_t high = (sz_u64_t )_mm_extract_epi64 (sums_vec.xmms [0 ], 1 );
53115311 return low + high;
53125312 }
@@ -5318,7 +5318,7 @@ SZ_PUBLIC sz_u64_t sz_checksum_avx512(sz_cptr_t text, sz_size_t length) {
53185318 __m128i low_xmm = _mm256_castsi256_si128 (sums_vec.ymms [0 ]);
53195319 __m128i high_xmm = _mm256_extracti128_si256 (sums_vec.ymms [0 ], 1 );
53205320 __m128i sums_xmm = _mm_add_epi64 (low_xmm, high_xmm);
5321- sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64x (sums_xmm);
5321+ sz_u64_t low = (sz_u64_t )_mm_cvtsi128_si64 (sums_xmm);
53225322 sz_u64_t high = (sz_u64_t )_mm_extract_epi64 (sums_xmm, 1 );
53235323 return low + high;
53245324 }
@@ -6092,7 +6092,7 @@ SZ_PUBLIC sz_bool_t sz_equal_neon(sz_cptr_t a, sz_cptr_t b, sz_size_t length) {
60926092 return sz_true_k;
60936093}
60946094
6095- SZ_PUBLIC sz_u64_t sz_checksum_neon (sz_cptr_t const * text, size_t length) {
6095+ SZ_PUBLIC sz_u64_t sz_checksum_neon (sz_cptr_t text, sz_size_t length) {
60966096 uint64x2_t sum_vec = vdupq_n_u64 (0 );
60976097
60986098 // Process 16 bytes (128 bits) at a time
0 commit comments