Skip to content

Commit 353dc3c

Browse files
author
Raghuveer Devulapalli
committed
Use _mm256_loadu_si256 to make it work on g++-10
1 parent bab65af commit 353dc3c

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

Makefile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
CXX = g++-12
1+
CXX ?= g++-12
2 2
SRCDIR = ./src
3 3
TESTDIR = ./tests
4 4
BENCHDIR = ./benchmarks

src/avx512-64bit-common.h

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -219,7 +219,7 @@ struct ymm_vector<uint32_t> {
219 219
}
220 220
static zmm_t loadu(void const *mem)
221 221
{
222-
return _mm256_loadu_epi32(mem);
222+
return _mm256_loadu_si256((__m256i*) mem);
223 223
}
224 224
static zmm_t max(zmm_t x, zmm_t y)
225 225
{
{
@@ -348,7 +348,7 @@ struct ymm_vector<int32_t> {
348 348
}
349 349
static zmm_t loadu(void const *mem)
350 350
{
351-
return _mm256_loadu_epi32(mem);
351+
return _mm256_loadu_si256((__m256i*) mem);
352 352
}
353 353
static zmm_t max(zmm_t x, zmm_t y)
354 354
{
{

0 commit comments

Comments
 (0)