|
138 | 138 | .macro _fold_vec acc, data, consts, tmp
|
139 | 139 | _pclmulqdq \consts, HI64_TERMS, \acc, HI64_TERMS, \tmp
|
140 | 140 | _pclmulqdq \consts, LO64_TERMS, \acc, LO64_TERMS, \acc
|
141 |
| -.if AVX_LEVEL < 10 |
| 141 | +.if AVX_LEVEL <= 2 |
142 | 142 | _cond_vex pxor, \data, \tmp, \tmp
|
143 | 143 | _cond_vex pxor, \tmp, \acc, \acc
|
144 | 144 | .else
|
|
201 | 201 | // \vl is the maximum length of vector register to use in bytes: 16, 32, or 64.
|
202 | 202 | //
|
203 | 203 | // \avx_level is the level of AVX support to use: 0 for SSE only, 2 for AVX2, or
|
204 |
| -// 10 for AVX10 or AVX512. |
| 204 | +// 512 for AVX512. |
205 | 205 | //
|
206 | 206 | // If \vl == 16 && \avx_level == 0, the generated code requires:
|
207 | 207 | // PCLMULQDQ && SSE4.1. (Note: all known CPUs with PCLMULQDQ also have SSE4.1.)
|
208 | 208 | //
|
209 | 209 | // If \vl == 32 && \avx_level == 2, the generated code requires:
|
210 | 210 | // VPCLMULQDQ && AVX2.
|
211 | 211 | //
|
212 |
| -// If \vl == 32 && \avx_level == 10, the generated code requires: |
213 |
| -// VPCLMULQDQ && (AVX10/256 || (AVX512BW && AVX512VL)) |
214 |
| -// |
215 |
| -// If \vl == 64 && \avx_level == 10, the generated code requires: |
216 |
| -// VPCLMULQDQ && (AVX10/512 || (AVX512BW && AVX512VL)) |
| 212 | +// If \vl == 64 && \avx_level == 512, the generated code requires: |
| 213 | +// VPCLMULQDQ && AVX512BW && AVX512VL. |
217 | 214 | //
|
218 | 215 | // Other \vl and \avx_level combinations are either not supported or not useful.
|
219 | 216 | .macro _crc_pclmul n, lsb_crc, vl, avx_level
|
|
534 | 531 | .if LSB_CRC && \n == 64
|
535 | 532 | _cond_vex punpcklqdq, %xmm1, %xmm2, %xmm2
|
536 | 533 | _pclmulqdq CONSTS_XMM, LO64_TERMS, %xmm1, HI64_TERMS, %xmm1
|
537 |
| - .if AVX_LEVEL < 10 |
| 534 | + .if AVX_LEVEL <= 2 |
538 | 535 | _cond_vex pxor, %xmm2, %xmm0, %xmm0
|
539 | 536 | _cond_vex pxor, %xmm1, %xmm0, %xmm0
|
540 | 537 | .else
|
@@ -574,13 +571,9 @@ SYM_FUNC_START(prefix##_vpclmul_avx2); \
|
574 | 571 | _crc_pclmul n=bits, lsb_crc=lsb, vl=32, avx_level=2; \
|
575 | 572 | SYM_FUNC_END(prefix##_vpclmul_avx2); \
|
576 | 573 | \
|
577 |
| -SYM_FUNC_START(prefix##_vpclmul_avx10_256); \ |
578 |
| - _crc_pclmul n=bits, lsb_crc=lsb, vl=32, avx_level=10; \ |
579 |
| -SYM_FUNC_END(prefix##_vpclmul_avx10_256); \ |
580 |
| - \ |
581 |
| -SYM_FUNC_START(prefix##_vpclmul_avx10_512); \ |
582 |
| - _crc_pclmul n=bits, lsb_crc=lsb, vl=64, avx_level=10; \ |
583 |
| -SYM_FUNC_END(prefix##_vpclmul_avx10_512); |
| 574 | +SYM_FUNC_START(prefix##_vpclmul_avx512); \ |
| 575 | + _crc_pclmul n=bits, lsb_crc=lsb, vl=64, avx_level=512; \ |
| 576 | +SYM_FUNC_END(prefix##_vpclmul_avx512); |
584 | 577 | #else
|
585 | 578 | #define DEFINE_CRC_PCLMUL_FUNCS(prefix, bits, lsb) \
|
586 | 579 | SYM_FUNC_START(prefix##_pclmul_sse); \
|
|
0 commit comments