Skip to content

Commit f542744

Browse files
jxravi authored and BiplabRaut committed
SNAPPY : Performance improvement with clang compiler
- Fixed regression in decompression with AOCC compiler. AMD-Internal JIRA: [CPUPL-4352]
1 parent 1406f14 commit f542744

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

algos/snappy/snappy.cc

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1131,7 +1131,7 @@ static inline uint32_t ExtractLowBytes_no_bmi(uint32_t v, int n) {
11311131

11321132
#ifdef AOCL_SNAPPY_AVX2_OPT
11331133
//#if SNAPPY_HAVE_BMI2
1134-
__attribute__((__target__("bmi2")))
1134+
__attribute__((__target__("bmi2,avx2")))
11351135
static inline uint32_t ExtractLowBytes_bmi(uint32_t v, int n) {
11361136
AOCL_SIMD_UNIT_TEST(DEBUG, logCtx, "Enter");
11371137
assert(n >= 0);
@@ -1231,7 +1231,7 @@ class SnappyDecompressor {
12311231
#if defined(__GNUC__) && defined(__x86_64__)
12321232
__attribute__((aligned(32)))
12331233
#endif
1234-
__attribute__((__target__("bmi2")))
1234+
__attribute__((__target__("bmi2,avx2")))
12351235
AOCL_SNAPPY_TARGET_AVX
12361236
void DecompressAllTags_bmi(Writer* writer) {
12371237
AOCL_SIMD_UNIT_TEST(DEBUG, logCtx, "Enter");

0 commit comments

Comments
 (0)