From ef979383a507277247d36b97572f4bf558e84305 Mon Sep 17 00:00:00 2001 From: "Wang, Phoebe" Date: Fri, 17 Jan 2025 21:25:19 +0800 Subject: [PATCH 1/2] [X86][AVX10.2-BF16] Remove [NE]P from intrinsic and instruction name Ref.: https://cdrdv2.intel.com/v1/dl/getContent/828965 --- clang/include/clang/Basic/BuiltinsX86.td | 96 +- clang/lib/CodeGen/CGBuiltin.cpp | 30 +- clang/lib/Headers/avx10_2_512bf16intrin.h | 210 +- clang/lib/Headers/avx10_2bf16intrin.h | 426 ++- clang/lib/Sema/SemaX86.cpp | 18 +- .../CodeGen/X86/avx10_2_512bf16-builtins.c | 300 +- clang/test/CodeGen/X86/avx10_2bf16-builtins.c | 546 +-- llvm/include/llvm/IR/IntrinsicsX86.td | 156 +- .../lib/Target/X86/AsmParser/X86AsmParser.cpp | 8 +- .../X86/MCTargetDesc/X86ATTInstPrinter.cpp | 18 +- .../X86/MCTargetDesc/X86InstComments.cpp | 4 +- .../X86/MCTargetDesc/X86InstPrinterCommon.cpp | 20 +- .../X86/MCTargetDesc/X86IntelInstPrinter.cpp | 18 +- llvm/lib/Target/X86/X86InstrAVX10.td | 140 +- llvm/lib/Target/X86/X86InstrFMA3Info.cpp | 4 +- llvm/lib/Target/X86/X86InstrUtils.td | 6 +- llvm/lib/Target/X86/X86IntrinsicsInfo.h | 54 +- llvm/test/CodeGen/X86/avx10.2-fma-commute.ll | 216 +- .../test/CodeGen/X86/avx10_2_512bf16-arith.ll | 220 +- .../CodeGen/X86/avx10_2_512bf16-intrinsics.ll | 194 +- llvm/test/CodeGen/X86/avx10_2bf16-arith.ll | 444 +-- .../CodeGen/X86/avx10_2bf16-intrinsics.ll | 444 +-- .../MC/Disassembler/X86/avx10.2-bf16-32.txt | 2984 ++++++++--------- .../MC/Disassembler/X86/avx10.2-bf16-64.txt | 2984 ++++++++--------- llvm/test/MC/X86/avx10.2-bf16-32-att.s | 2984 ++++++++--------- llvm/test/MC/X86/avx10.2-bf16-32-intel.s | 2984 ++++++++--------- llvm/test/MC/X86/avx10.2-bf16-64-att.s | 2984 ++++++++--------- llvm/test/MC/X86/avx10.2-bf16-64-intel.s | 2984 ++++++++--------- llvm/test/TableGen/x86-fold-tables.inc | 984 +++--- 29 files changed, 11225 insertions(+), 11235 deletions(-) diff --git a/clang/include/clang/Basic/BuiltinsX86.td b/clang/include/clang/Basic/BuiltinsX86.td index 
18fc10eb85c02..32d5486f162b3 100644 --- a/clang/include/clang/Basic/BuiltinsX86.td +++ b/clang/include/clang/Basic/BuiltinsX86.td @@ -5304,75 +5304,75 @@ let Features = "avx10.2-256", Attributes = [NoThrow, RequiredVectorWidth<128>] i } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vaddnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; + def vaddbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vaddnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; + def vaddbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vaddnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; + def vaddbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vdivnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; + def vdivbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vdivnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; + def vdivbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vdivnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; + def vdivbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; } let Features = "avx10.2-256", 
Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vmaxpbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; + def vmaxbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vmaxpbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; + def vmaxbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vmaxpbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; + def vmaxbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vminpbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; + def vminbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vminpbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; + def vminbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vminpbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; + def vminbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vmulnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; + def vmulbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; } let Features = "avx10.2-256", 
Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vmulnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; + def vmulbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vmulnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; + def vmulbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vsubnepbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; + def vsubbf16128 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vsubnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; + def vsubbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vsubnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; + def vsubbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { @@ -5385,120 +5385,120 @@ let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth< } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vcmppbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Vector<32, __bf16>, _Constant int, unsigned int)">; + def vcmpbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Vector<32, __bf16>, _Constant int, unsigned int)">; } let Features = "avx10.2-256", Attributes = 
[NoThrow, Const, RequiredVectorWidth<256>] in { - def vcmppbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Vector<16, __bf16>, _Constant int, unsigned short)">; + def vcmpbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Vector<16, __bf16>, _Constant int, unsigned short)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vcmppbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Vector<8, __bf16>, _Constant int, unsigned char)">; - def vfpclasspbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Constant int, unsigned char)">; + def vcmpbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Vector<8, __bf16>, _Constant int, unsigned char)">; + def vfpclassbf16128_mask : X86Builtin<"unsigned char(_Vector<8, __bf16>, _Constant int, unsigned char)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vfpclasspbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Constant int, unsigned short)">; + def vfpclassbf16256_mask : X86Builtin<"unsigned short(_Vector<16, __bf16>, _Constant int, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vfpclasspbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Constant int, unsigned int)">; + def vfpclassbf16512_mask : X86Builtin<"unsigned int(_Vector<32, __bf16>, _Constant int, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vscalefpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; + def vscalefbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vscalefpbf16256_mask : 
X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; + def vscalefbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vscalefpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; + def vscalefbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vrcppbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; + def vrcpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vrcppbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; + def vrcpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vrcppbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; + def vrcpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vgetexppbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; + def vgetexpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, 
RequiredVectorWidth<256>] in { - def vgetexppbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; + def vgetexpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vgetexppbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; + def vgetexpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vrsqrtpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; + def vrsqrtbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Vector<8, __bf16>, unsigned char)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vrsqrtpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; + def vrsqrtbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Vector<16, __bf16>, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vrsqrtpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; + def vrsqrtbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vreducenepbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">; + def vreducebf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">; } let Features = "avx10.2-256", Attributes 
= [NoThrow, Const, RequiredVectorWidth<256>] in { - def vreducenepbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">; + def vreducebf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vreducenepbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">; + def vreducebf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vrndscalenepbf16_128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">; + def vrndscalebf16_128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vrndscalenepbf16_256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">; + def vrndscalebf16_256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vrndscalenepbf16_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">; + def vrndscalebf16_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vgetmantpbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, 
unsigned char)">; + def vgetmantbf16128_mask : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>, _Constant int, _Vector<8, __bf16>, unsigned char)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vgetmantpbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">; + def vgetmantbf16256_mask : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>, _Constant int, _Vector<16, __bf16>, unsigned short)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vgetmantpbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">; + def vgetmantbf16512_mask : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Constant int, _Vector<32, __bf16>, unsigned int)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<128>] in { - def vsqrtnepbf16 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>)">; + def vsqrtbf16 : X86Builtin<"_Vector<8, __bf16>(_Vector<8, __bf16>)">; } let Features = "avx10.2-256", Attributes = [NoThrow, Const, RequiredVectorWidth<256>] in { - def vsqrtnepbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>)">; + def vsqrtbf16256 : X86Builtin<"_Vector<16, __bf16>(_Vector<16, __bf16>)">; } let Features = "avx10.2-512", Attributes = [NoThrow, Const, RequiredVectorWidth<512>] in { - def vsqrtnepbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>)">; + def vsqrtbf16512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>)">; def vfmaddnepbh512 : X86Builtin<"_Vector<32, __bf16>(_Vector<32, __bf16>, _Vector<32, __bf16>, _Vector<32, __bf16>)">; } diff --git a/clang/lib/CodeGen/CGBuiltin.cpp b/clang/lib/CodeGen/CGBuiltin.cpp index 2385f2a320b62..4160a5b8b59bf 100644 --- a/clang/lib/CodeGen/CGBuiltin.cpp +++ b/clang/lib/CodeGen/CGBuiltin.cpp @@ -16661,9 +16661,9 @@ Value 
*CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID, case X86::BI__builtin_ia32_sqrtph256: case X86::BI__builtin_ia32_sqrtph: case X86::BI__builtin_ia32_sqrtph512: - case X86::BI__builtin_ia32_vsqrtnepbf16256: - case X86::BI__builtin_ia32_vsqrtnepbf16: - case X86::BI__builtin_ia32_vsqrtnepbf16512: + case X86::BI__builtin_ia32_vsqrtbf16256: + case X86::BI__builtin_ia32_vsqrtbf16: + case X86::BI__builtin_ia32_vsqrtbf16512: case X86::BI__builtin_ia32_sqrtps512: case X86::BI__builtin_ia32_sqrtpd512: { if (Ops.size() == 2) { @@ -16883,9 +16883,9 @@ Value *CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID, case X86::BI__builtin_ia32_fpclassps128_mask: case X86::BI__builtin_ia32_fpclassps256_mask: case X86::BI__builtin_ia32_fpclassps512_mask: - case X86::BI__builtin_ia32_vfpclasspbf16128_mask: - case X86::BI__builtin_ia32_vfpclasspbf16256_mask: - case X86::BI__builtin_ia32_vfpclasspbf16512_mask: + case X86::BI__builtin_ia32_vfpclassbf16128_mask: + case X86::BI__builtin_ia32_vfpclassbf16256_mask: + case X86::BI__builtin_ia32_vfpclassbf16512_mask: case X86::BI__builtin_ia32_fpclassph128_mask: case X86::BI__builtin_ia32_fpclassph256_mask: case X86::BI__builtin_ia32_fpclassph512_mask: @@ -16900,14 +16900,14 @@ Value *CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID, Intrinsic::ID ID; switch (BuiltinID) { default: llvm_unreachable("Unsupported intrinsic!"); - case X86::BI__builtin_ia32_vfpclasspbf16128_mask: - ID = Intrinsic::x86_avx10_fpclass_nepbf16_128; + case X86::BI__builtin_ia32_vfpclassbf16128_mask: + ID = Intrinsic::x86_avx10_fpclass_bf16_128; break; - case X86::BI__builtin_ia32_vfpclasspbf16256_mask: - ID = Intrinsic::x86_avx10_fpclass_nepbf16_256; + case X86::BI__builtin_ia32_vfpclassbf16256_mask: + ID = Intrinsic::x86_avx10_fpclass_bf16_256; break; - case X86::BI__builtin_ia32_vfpclasspbf16512_mask: - ID = Intrinsic::x86_avx10_fpclass_nepbf16_512; + case X86::BI__builtin_ia32_vfpclassbf16512_mask: + ID = Intrinsic::x86_avx10_fpclass_bf16_512; break; 
case X86::BI__builtin_ia32_fpclassph128_mask: ID = Intrinsic::x86_avx512fp16_fpclass_ph_128; @@ -17067,9 +17067,9 @@ Value *CodeGenFunction::EmitX86BuiltinExpr(unsigned BuiltinID, case X86::BI__builtin_ia32_vcmppd256_round_mask: case X86::BI__builtin_ia32_vcmpps256_round_mask: case X86::BI__builtin_ia32_vcmpph256_round_mask: - case X86::BI__builtin_ia32_vcmppbf16512_mask: - case X86::BI__builtin_ia32_vcmppbf16256_mask: - case X86::BI__builtin_ia32_vcmppbf16128_mask: + case X86::BI__builtin_ia32_vcmpbf16512_mask: + case X86::BI__builtin_ia32_vcmpbf16256_mask: + case X86::BI__builtin_ia32_vcmpbf16128_mask: IsMaskFCmp = true; [[fallthrough]]; case X86::BI__builtin_ia32_cmpps: diff --git a/clang/lib/Headers/avx10_2_512bf16intrin.h b/clang/lib/Headers/avx10_2_512bf16intrin.h index 392b7ae770c5b..ce43ecbcfe047 100644 --- a/clang/lib/Headers/avx10_2_512bf16intrin.h +++ b/clang/lib/Headers/avx10_2_512bf16intrin.h @@ -62,17 +62,17 @@ static __inline __m512bh __DEFAULT_FN_ATTRS512 _mm512_set_pbh( (bf3), (bf2), (bf1)) static __inline__ __m512 __DEFAULT_FN_ATTRS512 -_mm512_castpbf16_ps(__m512bh __a) { +_mm512_castbf16_ps(__m512bh __a) { return (__m512)__a; } static __inline__ __m512d __DEFAULT_FN_ATTRS512 -_mm512_castpbf16_pd(__m512bh __a) { +_mm512_castbf16_pd(__m512bh __a) { return (__m512d)__a; } static __inline__ __m512i __DEFAULT_FN_ATTRS512 -_mm512_castpbf16_si512(__m512bh __a) { +_mm512_castbf16_si512(__m512bh __a) { return (__m512i)__a; } @@ -91,39 +91,39 @@ _mm512_castsi512_pbh(__m512i __a) { } static __inline__ __m128bh __DEFAULT_FN_ATTRS512 -_mm512_castpbf16512_pbh128(__m512bh __a) { +_mm512_castbf16512_pbh128(__m512bh __a) { return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7); } static __inline__ __m256bh __DEFAULT_FN_ATTRS512 -_mm512_castpbf16512_pbh256(__m512bh __a) { +_mm512_castbf16512_pbh256(__m512bh __a) { return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); } static __inline__ __m512bh 
__DEFAULT_FN_ATTRS512 -_mm512_castpbf16128_pbh512(__m128bh __a) { +_mm512_castbf16128_pbh512(__m128bh __a) { return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_castpbf16256_pbh512(__m256bh __a) { +_mm512_castbf16256_pbh512(__m256bh __a) { return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_zextpbf16128_pbh512(__m128bh __a) { +_mm512_zextbf16128_pbh512(__m128bh __a) { return __builtin_shufflevector( __a, (__v8bf)_mm_setzero_pbh(), 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 8, 9, 10, 11, 12, 13, 14, 15, 8, 9, 10, 11, 12, 13, 14, 15); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_zextpbf16256_pbh512(__m256bh __a) { +_mm512_zextbf16256_pbh512(__m256bh __a) { return __builtin_shufflevector(__a, (__v16bf)_mm256_setzero_pbh(), 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, @@ -178,81 +178,81 @@ _mm512_permutexvar_pbh(__m512i __A, __m512bh __B) { return (__m512bh)__builtin_ia32_permvarhi512((__v32hi)__B, (__v32hi)__A); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_addne_pbh(__m512bh __A, __m512bh __B) { +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_add_pbh(__m512bh __A, + __m512bh __B) { return (__m512bh)((__v32bf)__A + (__v32bf)__B); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_mask_addne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_mask_add_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_addne_pbh(__A, __B), (__v32bf)__W); + (__mmask32)__U, (__v32bf)_mm512_add_pbh(__A, __B), (__v32bf)__W); } static 
__inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_maskz_addne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_maskz_add_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_addne_pbh(__A, __B), + (__mmask32)__U, (__v32bf)_mm512_add_pbh(__A, __B), (__v32bf)_mm512_setzero_pbh()); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_subne_pbh(__m512bh __A, __m512bh __B) { +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_sub_pbh(__m512bh __A, + __m512bh __B) { return (__m512bh)((__v32bf)__A - (__v32bf)__B); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_mask_subne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_mask_sub_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_subne_pbh(__A, __B), (__v32bf)__W); + (__mmask32)__U, (__v32bf)_mm512_sub_pbh(__A, __B), (__v32bf)__W); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_maskz_subne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_maskz_sub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_subne_pbh(__A, __B), + (__mmask32)__U, (__v32bf)_mm512_sub_pbh(__A, __B), (__v32bf)_mm512_setzero_pbh()); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_mulne_pbh(__m512bh __A, __m512bh __B) { +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mul_pbh(__m512bh __A, + __m512bh __B) { return (__m512bh)((__v32bf)__A * (__v32bf)__B); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_mask_mulne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_mask_mul_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_mulne_pbh(__A, __B), (__v32bf)__W); + (__mmask32)__U, 
(__v32bf)_mm512_mul_pbh(__A, __B), (__v32bf)__W); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_maskz_mulne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_maskz_mul_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_mulne_pbh(__A, __B), + (__mmask32)__U, (__v32bf)_mm512_mul_pbh(__A, __B), (__v32bf)_mm512_setzero_pbh()); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_divne_pbh(__m512bh __A, __m512bh __B) { +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_div_pbh(__m512bh __A, + __m512bh __B) { return (__m512bh)((__v32bf)__A / (__v32bf)__B); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_mask_divne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_mask_div_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_divne_pbh(__A, __B), (__v32bf)__W); + (__mmask32)__U, (__v32bf)_mm512_div_pbh(__A, __B), (__v32bf)__W); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_maskz_divne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +_mm512_maskz_div_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { return (__m512bh)__builtin_ia32_selectpbf_512( - (__mmask32)__U, (__v32bf)_mm512_divne_pbh(__A, __B), + (__mmask32)__U, (__v32bf)_mm512_div_pbh(__A, __B), (__v32bf)_mm512_setzero_pbh()); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_max_pbh(__m512bh __A, __m512bh __B) { - return (__m512bh)__builtin_ia32_vmaxpbf16512((__v32bf)__A, (__v32bf)__B); + return (__m512bh)__builtin_ia32_vmaxbf16512((__v32bf)__A, (__v32bf)__B); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 @@ -270,7 +270,7 @@ _mm512_maskz_max_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_min_pbh(__m512bh __A, __m512bh __B) { - return (__m512bh)__builtin_ia32_vminpbf16512((__v32bf)__A, (__v32bf)__B); + 
return (__m512bh)__builtin_ia32_vminbf16512((__v32bf)__A, (__v32bf)__B); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 @@ -287,143 +287,143 @@ _mm512_maskz_min_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { } #define _mm512_cmp_pbh_mask(__A, __B, __P) \ - ((__mmask32)__builtin_ia32_vcmppbf16512_mask((__v32bf)(__m512bh)(__A), \ - (__v32bf)(__m512bh)(__B), \ - (int)(__P), (__mmask32) - 1)) + ((__mmask32)__builtin_ia32_vcmpbf16512_mask((__v32bf)(__m512bh)(__A), \ + (__v32bf)(__m512bh)(__B), \ + (int)(__P), (__mmask32) - 1)) #define _mm512_mask_cmp_pbh_mask(__U, __A, __B, __P) \ - ((__mmask32)__builtin_ia32_vcmppbf16512_mask((__v32bf)(__m512bh)(__A), \ - (__v32bf)(__m512bh)(__B), \ - (int)(__P), (__mmask32)(__U))) + ((__mmask32)__builtin_ia32_vcmpbf16512_mask((__v32bf)(__m512bh)(__A), \ + (__v32bf)(__m512bh)(__B), \ + (int)(__P), (__mmask32)(__U))) #define _mm512_mask_fpclass_pbh_mask(__U, __A, imm) \ - ((__mmask32)__builtin_ia32_vfpclasspbf16512_mask( \ + ((__mmask32)__builtin_ia32_vfpclassbf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__mmask32)(__U))) #define _mm512_fpclass_pbh_mask(__A, imm) \ - ((__mmask32)__builtin_ia32_vfpclasspbf16512_mask( \ + ((__mmask32)__builtin_ia32_vfpclassbf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__mmask32) - 1)) static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_scalef_pbh(__m512bh __A, __m512bh __B) { - return (__m512bh)__builtin_ia32_vscalefpbf16512_mask( + return (__m512bh)__builtin_ia32_vscalefbf16512_mask( (__v32bf)__A, (__v32bf)__B, (__v32bf)_mm512_undefined_pbh(), (__mmask32)-1); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_scalef_pbh( __m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { - return (__m512bh)__builtin_ia32_vscalefpbf16512_mask( + return (__m512bh)__builtin_ia32_vscalefbf16512_mask( (__v32bf)__A, (__v32bf)__B, (__v32bf)__W, (__mmask32)__U); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_scalef_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { - 
return (__m512bh)__builtin_ia32_vscalefpbf16512_mask( + return (__m512bh)__builtin_ia32_vscalefbf16512_mask( (__v32bf)__A, (__v32bf)__B, (__v32bf)_mm512_setzero_pbh(), (__mmask32)__U); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_rcp_pbh(__m512bh __A) { - return (__m512bh)__builtin_ia32_vrcppbf16512_mask( + return (__m512bh)__builtin_ia32_vrcpbf16512_mask( (__v32bf)__A, (__v32bf)_mm512_undefined_pbh(), (__mmask32)-1); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_rcp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) { - return (__m512bh)__builtin_ia32_vrcppbf16512_mask((__v32bf)__A, (__v32bf)__W, - (__mmask32)__U); + return (__m512bh)__builtin_ia32_vrcpbf16512_mask((__v32bf)__A, (__v32bf)__W, + (__mmask32)__U); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_rcp_pbh(__mmask32 __U, __m512bh __A) { - return (__m512bh)__builtin_ia32_vrcppbf16512_mask( + return (__m512bh)__builtin_ia32_vrcpbf16512_mask( (__v32bf)__A, (__v32bf)_mm512_setzero_pbh(), (__mmask32)__U); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_getexp_pbh(__m512bh __A) { - return (__m512bh)__builtin_ia32_vgetexppbf16512_mask( + return (__m512bh)__builtin_ia32_vgetexpbf16512_mask( (__v32bf)__A, (__v32bf)_mm512_undefined_pbh(), (__mmask32)-1); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_getexp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) { - return (__m512bh)__builtin_ia32_vgetexppbf16512_mask( + return (__m512bh)__builtin_ia32_vgetexpbf16512_mask( (__v32bf)__A, (__v32bf)__W, (__mmask32)__U); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_getexp_pbh(__mmask32 __U, __m512bh __A) { - return (__m512bh)__builtin_ia32_vgetexppbf16512_mask( + return (__m512bh)__builtin_ia32_vgetexpbf16512_mask( (__v32bf)__A, (__v32bf)_mm512_setzero_pbh(), (__mmask32)__U); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_rsqrt_pbh(__m512bh __A) { - return (__m512bh)__builtin_ia32_vrsqrtpbf16512_mask( + return 
(__m512bh)__builtin_ia32_vrsqrtbf16512_mask( (__v32bf)__A, (__v32bf)_mm512_undefined_pbh(), (__mmask32)-1); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_rsqrt_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) { - return (__m512bh)__builtin_ia32_vrsqrtpbf16512_mask( - (__v32bf)__A, (__v32bf)__W, (__mmask32)__U); + return (__m512bh)__builtin_ia32_vrsqrtbf16512_mask((__v32bf)__A, (__v32bf)__W, + (__mmask32)__U); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_rsqrt_pbh(__mmask32 __U, __m512bh __A) { - return (__m512bh)__builtin_ia32_vrsqrtpbf16512_mask( + return (__m512bh)__builtin_ia32_vrsqrtbf16512_mask( (__v32bf)__A, (__v32bf)_mm512_setzero_pbh(), (__mmask32)__U); } -#define _mm512_reducene_pbh(__A, imm) \ - ((__m512bh)__builtin_ia32_vreducenepbf16512_mask( \ +#define _mm512_reduce_pbh(__A, imm) \ + ((__m512bh)__builtin_ia32_vreducebf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_undefined_pbh(), \ (__mmask32) - 1)) -#define _mm512_mask_reducene_pbh(__W, __U, __A, imm) \ - ((__m512bh)__builtin_ia32_vreducenepbf16512_mask( \ +#define _mm512_mask_reduce_pbh(__W, __U, __A, imm) \ + ((__m512bh)__builtin_ia32_vreducebf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)(__m512bh)(__W), \ (__mmask32)(__U))) -#define _mm512_maskz_reducene_pbh(__U, __A, imm) \ - ((__m512bh)__builtin_ia32_vreducenepbf16512_mask( \ +#define _mm512_maskz_reduce_pbh(__U, __A, imm) \ + ((__m512bh)__builtin_ia32_vreducebf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_setzero_pbh(), \ (__mmask32)(__U))) -#define _mm512_roundscalene_pbh(__A, imm) \ - ((__m512bh)__builtin_ia32_vrndscalenepbf16_mask( \ +#define _mm512_roundscale_pbh(__A, imm) \ + ((__m512bh)__builtin_ia32_vrndscalebf16_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_setzero_pbh(), \ (__mmask32) - 1)) -#define _mm512_mask_roundscalene_pbh(__W, __U, __A, imm) \ - ((__m512bh)__builtin_ia32_vrndscalenepbf16_mask( \ +#define 
_mm512_mask_roundscale_pbh(__W, __U, __A, imm) \ + ((__m512bh)__builtin_ia32_vrndscalebf16_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)(__m512bh)(__W), \ (__mmask32)(__U))) -#define _mm512_maskz_roundscalene_pbh(__U, __A, imm) \ - ((__m512bh)__builtin_ia32_vrndscalenepbf16_mask( \ +#define _mm512_maskz_roundscale_pbh(__U, __A, imm) \ + ((__m512bh)__builtin_ia32_vrndscalebf16_mask( \ (__v32bf)(__m512bh)(__A), (int)(imm), (__v32bf)_mm512_setzero_pbh(), \ (__mmask32)(__U))) #define _mm512_getmant_pbh(__A, __B, __C) \ - ((__m512bh)__builtin_ia32_vgetmantpbf16512_mask( \ + ((__m512bh)__builtin_ia32_vgetmantbf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v32bf)_mm512_undefined_pbh(), (__mmask32) - 1)) #define _mm512_mask_getmant_pbh(__W, __U, __A, __B, __C) \ - ((__m512bh)__builtin_ia32_vgetmantpbf16512_mask( \ + ((__m512bh)__builtin_ia32_vgetmantbf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v32bf)(__m512bh)(__W), (__mmask32)(__U))) #define _mm512_maskz_getmant_pbh(__U, __A, __B, __C) \ - ((__m512bh)__builtin_ia32_vgetmantpbf16512_mask( \ + ((__m512bh)__builtin_ia32_vgetmantbf16512_mask( \ (__v32bf)(__m512bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v32bf)_mm512_setzero_pbh(), (__mmask32)(__U))) static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_sqrt_pbh(__m512bh __A) { - return (__m512bh)__builtin_ia32_vsqrtnepbf16512((__v32bf)__A); + return (__m512bh)__builtin_ia32_vsqrtbf16512((__v32bf)__A); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 @@ -440,122 +440,118 @@ _mm512_maskz_sqrt_pbh(__mmask32 __U, __m512bh __A) { } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_fmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { +_mm512_fmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, (__v32bf)__B, (__v32bf)__C); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fmaddne_pbh( - __m512bh __A, __mmask32 __U, __m512bh 
__B, __m512bh __C) { +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 +_mm512_mask_fmadd_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), - (__v32bf)__A); + _mm512_fmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__A); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmaddne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmadd_pbh( __m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), - (__v32bf)__C); + _mm512_fmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__C); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmaddne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmadd_pbh( __mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)_mm512_setzero_pbh()); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_fmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { +_mm512_fmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, (__v32bf)__B, -(__v32bf)__C); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fmsubne_pbh( - __m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 +_mm512_mask_fmsub_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), - (__v32bf)__A); + _mm512_fmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__A); } 
-static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmsubne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fmsub_pbh( __m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), - (__v32bf)__C); + _mm512_fmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__C); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmsubne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fmsub_pbh( __mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)_mm512_setzero_pbh()); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_fnmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { +_mm512_fnmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, -(__v32bf)__B, (__v32bf)__C); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmaddne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmadd_pbh( __m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fnmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fnmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__A); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmaddne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmadd_pbh( __m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fnmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fnmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__C); } -static __inline__ __m512bh 
__DEFAULT_FN_ATTRS512 _mm512_maskz_fnmaddne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fnmadd_pbh( __mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fnmaddne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fnmadd_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)_mm512_setzero_pbh()); } static __inline__ __m512bh __DEFAULT_FN_ATTRS512 -_mm512_fnmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { +_mm512_fnmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_vfmaddnepbh512((__v32bf)__A, -(__v32bf)__B, -(__v32bf)__C); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmsubne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask_fnmsub_pbh( __m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fnmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fnmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__A); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmsubne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_mask3_fnmsub_pbh( __m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fnmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fnmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)__C); } -static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fnmsubne_pbh( +static __inline__ __m512bh __DEFAULT_FN_ATTRS512 _mm512_maskz_fnmsub_pbh( __mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { return (__m512bh)__builtin_ia32_selectpbf_512( (__mmask32)__U, - _mm512_fnmsubne_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), + _mm512_fnmsub_pbh((__v32bf)__A, (__v32bf)__B, (__v32bf)__C), (__v32bf)_mm512_setzero_pbh()); } diff --git 
a/clang/lib/Headers/avx10_2bf16intrin.h b/clang/lib/Headers/avx10_2bf16intrin.h index 0a427b9b7418b..0f35f6e013707 100644 --- a/clang/lib/Headers/avx10_2bf16intrin.h +++ b/clang/lib/Headers/avx10_2bf16intrin.h @@ -35,31 +35,31 @@ static __inline __m128bh __DEFAULT_FN_ATTRS128 _mm_setzero_pbh(void) { return __builtin_bit_cast(__m128bh, _mm_setzero_ps()); } -static __inline__ __m128 __DEFAULT_FN_ATTRS128 _mm_castpbf16_ps(__m128bh __a) { +static __inline__ __m128 __DEFAULT_FN_ATTRS128 _mm_castbf16_ps(__m128bh __a) { return (__m128)__a; } static __inline__ __m256 __DEFAULT_FN_ATTRS256 -_mm256_castpbf16_ps(__m256bh __a) { +_mm256_castbf16_ps(__m256bh __a) { return (__m256)__a; } static __inline__ __m256d __DEFAULT_FN_ATTRS256 -_mm256_castpbf16_pd(__m256bh __a) { +_mm256_castbf16_pd(__m256bh __a) { return (__m256d)__a; } -static __inline__ __m128d __DEFAULT_FN_ATTRS128 _mm_castpbf16_pd(__m128bh __a) { +static __inline__ __m128d __DEFAULT_FN_ATTRS128 _mm_castbf16_pd(__m128bh __a) { return (__m128d)__a; } static __inline__ __m128i __DEFAULT_FN_ATTRS128 -_mm_castpbf16_si128(__m128bh __a) { +_mm_castbf16_si128(__m128bh __a) { return (__m128i)__a; } static __inline__ __m256i __DEFAULT_FN_ATTRS256 -_mm256_castpbf16_si256(__m256bh __a) { +_mm256_castbf16_si256(__m256bh __a) { return (__m256i)__a; } @@ -100,18 +100,18 @@ _mm256_castsi256_pbh(__m256i __a) { } static __inline__ __m128bh __DEFAULT_FN_ATTRS256 -_mm256_castpbf16256_pbh128(__m256bh __a) { +_mm256_castbf16256_pbh128(__m256bh __a) { return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_castpbf16128_pbh256(__m128bh __a) { +_mm256_castbf16128_pbh256(__m128bh __a) { return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7, -1, -1, -1, -1, -1, -1, -1, -1); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_zextpbf16128_pbh256(__m128bh __a) { +_mm256_zextbf16128_pbh256(__m128bh __a) { return __builtin_shufflevector(__a, 
(__v8bf)_mm_setzero_pbh(), 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); } @@ -309,153 +309,149 @@ _mm256_permutexvar_pbh(__m256i __A, __m256bh __B) { return (__m256bh)__builtin_ia32_permvarhi256((__v16hi)__B, (__v16hi)__A); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_addne_pbh(__m256bh __A, __m256bh __B) { +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_add_pbh(__m256bh __A, + __m256bh __B) { return (__m256bh)((__v16bf)__A + (__v16bf)__B); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_mask_addne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_mask_add_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_addne_pbh(__A, __B), (__v16bf)__W); + (__mmask16)__U, (__v16bf)_mm256_add_pbh(__A, __B), (__v16bf)__W); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_maskz_addne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_maskz_add_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_addne_pbh(__A, __B), + (__mmask16)__U, (__v16bf)_mm256_add_pbh(__A, __B), (__v16bf)_mm256_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_addne_pbh(__m128bh __A, - __m128bh __B) { +static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_add_pbh(__m128bh __A, + __m128bh __B) { return (__m128bh)((__v8bf)__A + (__v8bf)__B); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_addne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { +_mm_mask_add_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, (__v8bf)_mm_addne_pbh(__A, __B), (__v8bf)__W); + (__mmask8)__U, (__v8bf)_mm_add_pbh(__A, __B), (__v8bf)__W); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_maskz_addne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { - return 
(__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U, - (__v8bf)_mm_addne_pbh(__A, __B), - (__v8bf)_mm_setzero_pbh()); +_mm_maskz_add_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { + return (__m128bh)__builtin_ia32_selectpbf_128( + (__mmask8)__U, (__v8bf)_mm_add_pbh(__A, __B), (__v8bf)_mm_setzero_pbh()); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_subne_pbh(__m256bh __A, __m256bh __B) { +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_sub_pbh(__m256bh __A, + __m256bh __B) { return (__m256bh)((__v16bf)__A - (__v16bf)__B); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_mask_subne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_mask_sub_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_subne_pbh(__A, __B), (__v16bf)__W); + (__mmask16)__U, (__v16bf)_mm256_sub_pbh(__A, __B), (__v16bf)__W); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_maskz_subne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_maskz_sub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_subne_pbh(__A, __B), + (__mmask16)__U, (__v16bf)_mm256_sub_pbh(__A, __B), (__v16bf)_mm256_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_subne_pbh(__m128bh __A, - __m128bh __B) { +static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_sub_pbh(__m128bh __A, + __m128bh __B) { return (__m128bh)((__v8bf)__A - (__v8bf)__B); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_subne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { +_mm_mask_sub_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, (__v8bf)_mm_subne_pbh(__A, __B), (__v8bf)__W); + (__mmask8)__U, (__v8bf)_mm_sub_pbh(__A, __B), (__v8bf)__W); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 
-_mm_maskz_subne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U, - (__v8bf)_mm_subne_pbh(__A, __B), - (__v8bf)_mm_setzero_pbh()); +_mm_maskz_sub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { + return (__m128bh)__builtin_ia32_selectpbf_128( + (__mmask8)__U, (__v8bf)_mm_sub_pbh(__A, __B), (__v8bf)_mm_setzero_pbh()); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_mulne_pbh(__m256bh __A, __m256bh __B) { +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mul_pbh(__m256bh __A, + __m256bh __B) { return (__m256bh)((__v16bf)__A * (__v16bf)__B); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_mask_mulne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_mask_mul_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_mulne_pbh(__A, __B), (__v16bf)__W); + (__mmask16)__U, (__v16bf)_mm256_mul_pbh(__A, __B), (__v16bf)__W); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_maskz_mulne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_maskz_mul_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_mulne_pbh(__A, __B), + (__mmask16)__U, (__v16bf)_mm256_mul_pbh(__A, __B), (__v16bf)_mm256_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mulne_pbh(__m128bh __A, - __m128bh __B) { +static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mul_pbh(__m128bh __A, + __m128bh __B) { return (__m128bh)((__v8bf)__A * (__v8bf)__B); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_mulne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { +_mm_mask_mul_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, (__v8bf)_mm_mulne_pbh(__A, __B), (__v8bf)__W); + (__mmask8)__U, (__v8bf)_mm_mul_pbh(__A, __B), 
(__v8bf)__W); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_maskz_mulne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U, - (__v8bf)_mm_mulne_pbh(__A, __B), - (__v8bf)_mm_setzero_pbh()); +_mm_maskz_mul_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { + return (__m128bh)__builtin_ia32_selectpbf_128( + (__mmask8)__U, (__v8bf)_mm_mul_pbh(__A, __B), (__v8bf)_mm_setzero_pbh()); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_divne_pbh(__m256bh __A, __m256bh __B) { +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_div_pbh(__m256bh __A, + __m256bh __B) { return (__m256bh)((__v16bf)__A / (__v16bf)__B); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_mask_divne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_mask_div_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_divne_pbh(__A, __B), (__v16bf)__W); + (__mmask16)__U, (__v16bf)_mm256_div_pbh(__A, __B), (__v16bf)__W); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_maskz_divne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +_mm256_maskz_div_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { return (__m256bh)__builtin_ia32_selectpbf_256( - (__mmask16)__U, (__v16bf)_mm256_divne_pbh(__A, __B), + (__mmask16)__U, (__v16bf)_mm256_div_pbh(__A, __B), (__v16bf)_mm256_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_divne_pbh(__m128bh __A, - __m128bh __B) { +static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_div_pbh(__m128bh __A, + __m128bh __B) { return (__m128bh)((__v8bf)__A / (__v8bf)__B); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_divne_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { +_mm_mask_div_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, (__v8bf)_mm_divne_pbh(__A, 
__B), (__v8bf)__W); + (__mmask8)__U, (__v8bf)_mm_div_pbh(__A, __B), (__v8bf)__W); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_maskz_divne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_selectpbf_128((__mmask8)__U, - (__v8bf)_mm_divne_pbh(__A, __B), - (__v8bf)_mm_setzero_pbh()); +_mm_maskz_div_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { + return (__m128bh)__builtin_ia32_selectpbf_128( + (__mmask8)__U, (__v8bf)_mm_div_pbh(__A, __B), (__v8bf)_mm_setzero_pbh()); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_max_pbh(__m256bh __A, __m256bh __B) { - return (__m256bh)__builtin_ia32_vmaxpbf16256((__v16bf)__A, (__v16bf)__B); + return (__m256bh)__builtin_ia32_vmaxbf16256((__v16bf)__A, (__v16bf)__B); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 @@ -473,7 +469,7 @@ _mm256_maskz_max_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_max_pbh(__m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_vmaxpbf16128((__v8bf)__A, (__v8bf)__B); + return (__m128bh)__builtin_ia32_vmaxbf16128((__v8bf)__A, (__v8bf)__B); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 @@ -490,7 +486,7 @@ _mm_maskz_max_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_min_pbh(__m256bh __A, __m256bh __B) { - return (__m256bh)__builtin_ia32_vminpbf16256((__v16bf)__A, (__v16bf)__B); + return (__m256bh)__builtin_ia32_vminbf16256((__v16bf)__A, (__v16bf)__B); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 @@ -508,7 +504,7 @@ _mm256_maskz_min_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_min_pbh(__m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_vminpbf16128((__v8bf)__A, (__v8bf)__B); + return (__m128bh)__builtin_ia32_vminbf16128((__v8bf)__A, (__v8bf)__B); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 @@ -554,275 +550,275 @@ static __inline__ int 
__DEFAULT_FN_ATTRS128 _mm_comneqsbh(__m128bh A, } #define _mm256_cmp_pbh_mask(__A, __B, __P) \ - ((__mmask16)__builtin_ia32_vcmppbf16256_mask((__v16bf)(__m256bh)(__A), \ - (__v16bf)(__m256bh)(__B), \ - (int)(__P), (__mmask16) - 1)) + ((__mmask16)__builtin_ia32_vcmpbf16256_mask((__v16bf)(__m256bh)(__A), \ + (__v16bf)(__m256bh)(__B), \ + (int)(__P), (__mmask16) - 1)) #define _mm256_mask_cmp_pbh_mask(__U, __A, __B, __P) \ - ((__mmask16)__builtin_ia32_vcmppbf16256_mask((__v16bf)(__m256bh)(__A), \ - (__v16bf)(__m256bh)(__B), \ - (int)(__P), (__mmask16)(__U))) + ((__mmask16)__builtin_ia32_vcmpbf16256_mask((__v16bf)(__m256bh)(__A), \ + (__v16bf)(__m256bh)(__B), \ + (int)(__P), (__mmask16)(__U))) #define _mm_cmp_pbh_mask(__A, __B, __P) \ - ((__mmask8)__builtin_ia32_vcmppbf16128_mask((__v8bf)(__m128bh)(__A), \ - (__v8bf)(__m128bh)(__B), \ - (int)(__P), (__mmask8) - 1)) + ((__mmask8)__builtin_ia32_vcmpbf16128_mask((__v8bf)(__m128bh)(__A), \ + (__v8bf)(__m128bh)(__B), \ + (int)(__P), (__mmask8) - 1)) #define _mm_mask_cmp_pbh_mask(__U, __A, __B, __P) \ - ((__mmask8)__builtin_ia32_vcmppbf16128_mask((__v8bf)(__m128bh)(__A), \ - (__v8bf)(__m128bh)(__B), \ - (int)(__P), (__mmask8)(__U))) + ((__mmask8)__builtin_ia32_vcmpbf16128_mask((__v8bf)(__m128bh)(__A), \ + (__v8bf)(__m128bh)(__B), \ + (int)(__P), (__mmask8)(__U))) #define _mm256_mask_fpclass_pbh_mask(__U, __A, imm) \ - ((__mmask16)__builtin_ia32_vfpclasspbf16256_mask( \ + ((__mmask16)__builtin_ia32_vfpclassbf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__mmask16)(__U))) #define _mm256_fpclass_pbh_mask(__A, imm) \ - ((__mmask16)__builtin_ia32_vfpclasspbf16256_mask( \ + ((__mmask16)__builtin_ia32_vfpclassbf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__mmask16) - 1)) #define _mm_mask_fpclass_pbh_mask(__U, __A, imm) \ - ((__mmask8)__builtin_ia32_vfpclasspbf16128_mask( \ - (__v8bf)(__m128bh)(__A), (int)(imm), (__mmask8)(__U))) + ((__mmask8)__builtin_ia32_vfpclassbf16128_mask((__v8bf)(__m128bh)(__A), \ + (int)(imm), 
(__mmask8)(__U))) #define _mm_fpclass_pbh_mask(__A, imm) \ - ((__mmask8)__builtin_ia32_vfpclasspbf16128_mask((__v8bf)(__m128bh)(__A), \ - (int)(imm), (__mmask8) - 1)) + ((__mmask8)__builtin_ia32_vfpclassbf16128_mask((__v8bf)(__m128bh)(__A), \ + (int)(imm), (__mmask8) - 1)) static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_scalef_pbh(__m256bh __A, __m256bh __B) { - return (__m256bh)__builtin_ia32_vscalefpbf16256_mask( + return (__m256bh)__builtin_ia32_vscalefbf16256_mask( (__v16bf)__A, (__v16bf)__B, (__v16bf)_mm256_undefined_pbh(), (__mmask16)-1); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_scalef_pbh( __m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { - return (__m256bh)__builtin_ia32_vscalefpbf16256_mask( + return (__m256bh)__builtin_ia32_vscalefbf16256_mask( (__v16bf)__A, (__v16bf)__B, (__v16bf)__W, (__mmask16)__U); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_scalef_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { - return (__m256bh)__builtin_ia32_vscalefpbf16256_mask( + return (__m256bh)__builtin_ia32_vscalefbf16256_mask( (__v16bf)__A, (__v16bf)__B, (__v16bf)_mm256_setzero_pbh(), (__mmask16)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_scalef_pbh(__m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_vscalefpbf16128_mask( + return (__m128bh)__builtin_ia32_vscalefbf16128_mask( (__v8bf)__A, (__v8bf)__B, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mask_scalef_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_vscalefpbf16128_mask( + return (__m128bh)__builtin_ia32_vscalefbf16128_mask( (__v8bf)__A, (__v8bf)__B, (__v8bf)__W, (__mmask8)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_maskz_scalef_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { - return (__m128bh)__builtin_ia32_vscalefpbf16128_mask( + return (__m128bh)__builtin_ia32_vscalefbf16128_mask( (__v8bf)__A, (__v8bf)__B, 
(__v8bf)_mm_setzero_pbh(), (__mmask8)__U); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_rcp_pbh(__m256bh __A) { - return (__m256bh)__builtin_ia32_vrcppbf16256_mask( + return (__m256bh)__builtin_ia32_vrcpbf16256_mask( (__v16bf)__A, (__v16bf)_mm256_undefined_pbh(), (__mmask16)-1); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_rcp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { - return (__m256bh)__builtin_ia32_vrcppbf16256_mask((__v16bf)__A, (__v16bf)__W, - (__mmask16)__U); + return (__m256bh)__builtin_ia32_vrcpbf16256_mask((__v16bf)__A, (__v16bf)__W, + (__mmask16)__U); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_rcp_pbh(__mmask16 __U, __m256bh __A) { - return (__m256bh)__builtin_ia32_vrcppbf16256_mask( + return (__m256bh)__builtin_ia32_vrcpbf16256_mask( (__v16bf)__A, (__v16bf)_mm256_setzero_pbh(), (__mmask16)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_rcp_pbh(__m128bh __A) { - return (__m128bh)__builtin_ia32_vrcppbf16128_mask( + return (__m128bh)__builtin_ia32_vrcpbf16128_mask( (__v8bf)__A, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mask_rcp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { - return (__m128bh)__builtin_ia32_vrcppbf16128_mask((__v8bf)__A, (__v8bf)__W, - (__mmask8)__U); + return (__m128bh)__builtin_ia32_vrcpbf16128_mask((__v8bf)__A, (__v8bf)__W, + (__mmask8)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_maskz_rcp_pbh(__mmask8 __U, __m128bh __A) { - return (__m128bh)__builtin_ia32_vrcppbf16128_mask( + return (__m128bh)__builtin_ia32_vrcpbf16128_mask( (__v8bf)__A, (__v8bf)_mm_setzero_pbh(), (__mmask8)__U); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_getexp_pbh(__m256bh __A) { - return (__m256bh)__builtin_ia32_vgetexppbf16256_mask( + return (__m256bh)__builtin_ia32_vgetexpbf16256_mask( (__v16bf)__A, (__v16bf)_mm256_undefined_pbh(), (__mmask16)-1); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 
_mm256_mask_getexp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { - return (__m256bh)__builtin_ia32_vgetexppbf16256_mask( + return (__m256bh)__builtin_ia32_vgetexpbf16256_mask( (__v16bf)__A, (__v16bf)__W, (__mmask16)__U); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_getexp_pbh(__mmask16 __U, __m256bh __A) { - return (__m256bh)__builtin_ia32_vgetexppbf16256_mask( + return (__m256bh)__builtin_ia32_vgetexpbf16256_mask( (__v16bf)__A, (__v16bf)_mm256_setzero_pbh(), (__mmask16)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_getexp_pbh(__m128bh __A) { - return (__m128bh)__builtin_ia32_vgetexppbf16128_mask( + return (__m128bh)__builtin_ia32_vgetexpbf16128_mask( (__v8bf)__A, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mask_getexp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { - return (__m128bh)__builtin_ia32_vgetexppbf16128_mask((__v8bf)__A, (__v8bf)__W, - (__mmask8)__U); + return (__m128bh)__builtin_ia32_vgetexpbf16128_mask((__v8bf)__A, (__v8bf)__W, + (__mmask8)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_maskz_getexp_pbh(__mmask8 __U, __m128bh __A) { - return (__m128bh)__builtin_ia32_vgetexppbf16128_mask( + return (__m128bh)__builtin_ia32_vgetexpbf16128_mask( (__v8bf)__A, (__v8bf)_mm_setzero_pbh(), (__mmask8)__U); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_rsqrt_pbh(__m256bh __A) { - return (__m256bh)__builtin_ia32_vrsqrtpbf16256_mask( + return (__m256bh)__builtin_ia32_vrsqrtbf16256_mask( (__v16bf)__A, (__v16bf)_mm256_undefined_pbh(), (__mmask16)-1); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_rsqrt_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { - return (__m256bh)__builtin_ia32_vrsqrtpbf16256_mask( - (__v16bf)__A, (__v16bf)__W, (__mmask16)__U); + return (__m256bh)__builtin_ia32_vrsqrtbf16256_mask((__v16bf)__A, (__v16bf)__W, + (__mmask16)__U); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_rsqrt_pbh(__mmask16 __U, 
__m256bh __A) { - return (__m256bh)__builtin_ia32_vrsqrtpbf16256_mask( + return (__m256bh)__builtin_ia32_vrsqrtbf16256_mask( (__v16bf)__A, (__v16bf)_mm256_setzero_pbh(), (__mmask16)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_rsqrt_pbh(__m128bh __A) { - return (__m128bh)__builtin_ia32_vrsqrtpbf16128_mask( + return (__m128bh)__builtin_ia32_vrsqrtbf16128_mask( (__v8bf)__A, (__v8bf)_mm_undefined_pbh(), (__mmask8)-1); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_mask_rsqrt_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { - return (__m128bh)__builtin_ia32_vrsqrtpbf16128_mask((__v8bf)__A, (__v8bf)__W, - (__mmask8)__U); + return (__m128bh)__builtin_ia32_vrsqrtbf16128_mask((__v8bf)__A, (__v8bf)__W, + (__mmask8)__U); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_maskz_rsqrt_pbh(__mmask8 __U, __m128bh __A) { - return (__m128bh)__builtin_ia32_vrsqrtpbf16128_mask( + return (__m128bh)__builtin_ia32_vrsqrtbf16128_mask( (__v8bf)__A, (__v8bf)_mm_setzero_pbh(), (__mmask8)__U); } -#define _mm256_reducene_pbh(__A, imm) \ - ((__m256bh)__builtin_ia32_vreducenepbf16256_mask( \ +#define _mm256_reduce_pbh(__A, imm) \ + ((__m256bh)__builtin_ia32_vreducebf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_undefined_pbh(), \ (__mmask16) - 1)) -#define _mm256_mask_reducene_pbh(__W, __U, __A, imm) \ - ((__m256bh)__builtin_ia32_vreducenepbf16256_mask( \ +#define _mm256_mask_reduce_pbh(__W, __U, __A, imm) \ + ((__m256bh)__builtin_ia32_vreducebf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)(__m256bh)(__W), \ (__mmask16)(__U))) -#define _mm256_maskz_reducene_pbh(__U, __A, imm) \ - ((__m256bh)__builtin_ia32_vreducenepbf16256_mask( \ +#define _mm256_maskz_reduce_pbh(__U, __A, imm) \ + ((__m256bh)__builtin_ia32_vreducebf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_setzero_pbh(), \ (__mmask16)(__U))) -#define _mm_reducene_pbh(__A, imm) \ - ((__m128bh)__builtin_ia32_vreducenepbf16128_mask( \ +#define 
_mm_reduce_pbh(__A, imm) \ + ((__m128bh)__builtin_ia32_vreducebf16128_mask( \ (__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_undefined_pbh(), \ (__mmask8) - 1)) -#define _mm_mask_reducene_pbh(__W, __U, __A, imm) \ - ((__m128bh)__builtin_ia32_vreducenepbf16128_mask( \ +#define _mm_mask_reduce_pbh(__W, __U, __A, imm) \ + ((__m128bh)__builtin_ia32_vreducebf16128_mask( \ (__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)(__m128bh)(__W), \ (__mmask8)(__U))) -#define _mm_maskz_reducene_pbh(__U, __A, imm) \ - ((__m128bh)__builtin_ia32_vreducenepbf16128_mask( \ +#define _mm_maskz_reduce_pbh(__U, __A, imm) \ + ((__m128bh)__builtin_ia32_vreducebf16128_mask( \ (__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_setzero_pbh(), \ (__mmask8)(__U))) -#define _mm256_roundscalene_pbh(__A, imm) \ - ((__m256bh)__builtin_ia32_vrndscalenepbf16_256_mask( \ +#define _mm256_roundscale_pbh(__A, imm) \ + ((__m256bh)__builtin_ia32_vrndscalebf16_256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_setzero_pbh(), \ (__mmask16) - 1)) -#define _mm256_mask_roundscalene_pbh(__W, __U, __A, imm) \ - ((__m256bh)__builtin_ia32_vrndscalenepbf16_256_mask( \ +#define _mm256_mask_roundscale_pbh(__W, __U, __A, imm) \ + ((__m256bh)__builtin_ia32_vrndscalebf16_256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)(__m256bh)(__W), \ (__mmask16)(__U))) -#define _mm256_maskz_roundscalene_pbh(__U, __A, imm) \ - ((__m256bh)__builtin_ia32_vrndscalenepbf16_256_mask( \ +#define _mm256_maskz_roundscale_pbh(__U, __A, imm) \ + ((__m256bh)__builtin_ia32_vrndscalebf16_256_mask( \ (__v16bf)(__m256bh)(__A), (int)(imm), (__v16bf)_mm256_setzero_pbh(), \ (__mmask16)(__U))) -#define _mm_roundscalene_pbh(__A, imm) \ - ((__m128bh)__builtin_ia32_vrndscalenepbf16_128_mask( \ +#define _mm_roundscale_pbh(__A, imm) \ + ((__m128bh)__builtin_ia32_vrndscalebf16_128_mask( \ (__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_setzero_pbh(), \ (__mmask8) - 1)) -#define _mm_mask_roundscalene_pbh(__W, __U, __A, imm) \ - 
((__m128bh)__builtin_ia32_vrndscalenepbf16_128_mask( \ +#define _mm_mask_roundscale_pbh(__W, __U, __A, imm) \ + ((__m128bh)__builtin_ia32_vrndscalebf16_128_mask( \ (__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)(__m128bh)(__W), \ (__mmask8)(__U))) -#define _mm_maskz_roundscalene_pbh(__U, __A, imm) \ - ((__m128bh)__builtin_ia32_vrndscalenepbf16_128_mask( \ +#define _mm_maskz_roundscale_pbh(__U, __A, imm) \ + ((__m128bh)__builtin_ia32_vrndscalebf16_128_mask( \ (__v8bf)(__m128bh)(__A), (int)(imm), (__v8bf)_mm_setzero_pbh(), \ (__mmask8)(__U))) #define _mm256_getmant_pbh(__A, __B, __C) \ - ((__m256bh)__builtin_ia32_vgetmantpbf16256_mask( \ + ((__m256bh)__builtin_ia32_vgetmantbf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v16bf)_mm256_undefined_pbh(), (__mmask16) - 1)) #define _mm256_mask_getmant_pbh(__W, __U, __A, __B, __C) \ - ((__m256bh)__builtin_ia32_vgetmantpbf16256_mask( \ + ((__m256bh)__builtin_ia32_vgetmantbf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v16bf)(__m256bh)(__W), (__mmask16)(__U))) #define _mm256_maskz_getmant_pbh(__U, __A, __B, __C) \ - ((__m256bh)__builtin_ia32_vgetmantpbf16256_mask( \ + ((__m256bh)__builtin_ia32_vgetmantbf16256_mask( \ (__v16bf)(__m256bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v16bf)_mm256_setzero_pbh(), (__mmask16)(__U))) #define _mm_getmant_pbh(__A, __B, __C) \ - ((__m128bh)__builtin_ia32_vgetmantpbf16128_mask( \ + ((__m128bh)__builtin_ia32_vgetmantbf16128_mask( \ (__v8bf)(__m128bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v8bf)_mm_undefined_pbh(), (__mmask8) - 1)) #define _mm_mask_getmant_pbh(__W, __U, __A, __B, __C) \ - ((__m128bh)__builtin_ia32_vgetmantpbf16128_mask( \ + ((__m128bh)__builtin_ia32_vgetmantbf16128_mask( \ (__v8bf)(__m128bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v8bf)(__m128bh)(__W), (__mmask8)(__U))) #define _mm_maskz_getmant_pbh(__U, __A, __B, __C) \ - ((__m128bh)__builtin_ia32_vgetmantpbf16128_mask( \ + ((__m128bh)__builtin_ia32_vgetmantbf16128_mask( \ 
(__v8bf)(__m128bh)(__A), (int)(((__C) << 2) | (__B)), \ (__v8bf)_mm_setzero_pbh(), (__mmask8)(__U))) static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_sqrt_pbh(__m256bh __A) { - return (__m256bh)__builtin_ia32_vsqrtnepbf16256((__v16bf)__A); + return (__m256bh)__builtin_ia32_vsqrtbf16256((__v16bf)__A); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 @@ -839,7 +835,7 @@ _mm256_maskz_sqrt_pbh(__mmask16 __U, __m256bh __A) { } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_sqrt_pbh(__m128bh __A) { - return (__m128bh)__builtin_ia32_vsqrtnepbf16((__v8bf)__A); + return (__m128bh)__builtin_ia32_vsqrtbf16((__v8bf)__A); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 @@ -855,232 +851,230 @@ _mm_maskz_sqrt_pbh(__mmask8 __U, __m128bh __A) { } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_fmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { +_mm256_fmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, (__v16bf)__B, (__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fmaddne_pbh( - __m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 +_mm256_mask_fmadd_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), - (__v16bf)__A); + _mm256_fmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__A); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmaddne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmadd_pbh( __m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), - (__v16bf)__C); + _mm256_fmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 
_mm256_maskz_fmaddne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fmadd_pbh( __mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)_mm256_setzero_pbh()); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_fmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { +_mm256_fmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, (__v16bf)__B, -(__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fmsubne_pbh( - __m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 +_mm256_mask_fmsub_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), - (__v16bf)__A); + _mm256_fmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__A); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmsubne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fmsub_pbh( __m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), - (__v16bf)__C); + _mm256_fmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fmsubne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fmsub_pbh( __mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), 
(__v16bf)_mm256_setzero_pbh()); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_fnmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { +_mm256_fnmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, -(__v16bf)__B, (__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmaddne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmadd_pbh( __m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fnmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fnmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__A); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmaddne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmadd_pbh( __m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fnmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fnmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmaddne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmadd_pbh( __mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fnmaddne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fnmadd_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)_mm256_setzero_pbh()); } static __inline__ __m256bh __DEFAULT_FN_ATTRS256 -_mm256_fnmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { +_mm256_fnmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_vfmaddnepbh256((__v16bf)__A, -(__v16bf)__B, -(__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmsubne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask_fnmsub_pbh( 
__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fnmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fnmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__A); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmsubne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_mask3_fnmsub_pbh( __m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fnmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fnmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)__C); } -static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmsubne_pbh( +static __inline__ __m256bh __DEFAULT_FN_ATTRS256 _mm256_maskz_fnmsub_pbh( __mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { return (__m256bh)__builtin_ia32_selectpbf_256( (__mmask16)__U, - _mm256_fnmsubne_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), + _mm256_fnmsub_pbh((__v16bf)__A, (__v16bf)__B, (__v16bf)__C), (__v16bf)_mm256_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmaddne_pbh(__m128bh __A, - __m128bh __B, - __m128bh __C) { +static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmadd_pbh(__m128bh __A, + __m128bh __B, + __m128bh __C) { return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, (__v8bf)__B, (__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_fmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { +_mm_mask_fmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__A); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask3_fmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { 
+_mm_mask3_fmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_maskz_fmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { +_mm_maskz_fmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)_mm_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmsubne_pbh(__m128bh __A, - __m128bh __B, - __m128bh __C) { +static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fmsub_pbh(__m128bh __A, + __m128bh __B, + __m128bh __C) { return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, (__v8bf)__B, -(__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_fmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { +_mm_mask_fmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__A); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask3_fmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { +_mm_mask3_fmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_maskz_fmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { 
+_mm_maskz_fmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)_mm_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { +static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fnmadd_pbh(__m128bh __A, + __m128bh __B, + __m128bh __C) { return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, -(__v8bf)__B, (__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_fnmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { +_mm_mask_fnmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fnmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fnmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__A); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask3_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { +_mm_mask3_fnmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fnmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fnmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_maskz_fnmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { +_mm_maskz_fnmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fnmaddne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fnmadd_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)_mm_setzero_pbh()); } -static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { 
+static __inline__ __m128bh __DEFAULT_FN_ATTRS128 _mm_fnmsub_pbh(__m128bh __A, + __m128bh __B, + __m128bh __C) { return (__m128bh)__builtin_ia32_vfmaddnepbh128((__v8bf)__A, -(__v8bf)__B, -(__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask_fnmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { +_mm_mask_fnmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fnmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fnmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__A); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_mask3_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { +_mm_mask3_fnmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fnmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fnmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)__C); } static __inline__ __m128bh __DEFAULT_FN_ATTRS128 -_mm_maskz_fnmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { +_mm_maskz_fnmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { return (__m128bh)__builtin_ia32_selectpbf_128( - (__mmask8)__U, _mm_fnmsubne_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), + (__mmask8)__U, _mm_fnmsub_pbh((__v8bf)__A, (__v8bf)__B, (__v8bf)__C), (__v8bf)_mm_setzero_pbh()); } diff --git a/clang/lib/Sema/SemaX86.cpp b/clang/lib/Sema/SemaX86.cpp index 0b4b78c5b15dc..39c8ce1534c22 100644 --- a/clang/lib/Sema/SemaX86.cpp +++ b/clang/lib/Sema/SemaX86.cpp @@ -931,9 +931,9 @@ bool SemaX86::CheckBuiltinFunctionCall(const TargetInfo &TI, unsigned BuiltinID, case X86::BI__builtin_ia32_rndscaleps_mask: case X86::BI__builtin_ia32_rndscalepd_mask: case X86::BI__builtin_ia32_rndscaleph_mask: - case X86::BI__builtin_ia32_vrndscalenepbf16_128_mask: - case X86::BI__builtin_ia32_vrndscalenepbf16_256_mask: - 
case X86::BI__builtin_ia32_vrndscalenepbf16_mask: + case X86::BI__builtin_ia32_vrndscalebf16_128_mask: + case X86::BI__builtin_ia32_vrndscalebf16_256_mask: + case X86::BI__builtin_ia32_vrndscalebf16_mask: case X86::BI__builtin_ia32_reducepd128_mask: case X86::BI__builtin_ia32_reducepd256_mask: case X86::BI__builtin_ia32_reducepd512_mask: @@ -943,9 +943,9 @@ bool SemaX86::CheckBuiltinFunctionCall(const TargetInfo &TI, unsigned BuiltinID, case X86::BI__builtin_ia32_reduceph128_mask: case X86::BI__builtin_ia32_reduceph256_mask: case X86::BI__builtin_ia32_reduceph512_mask: - case X86::BI__builtin_ia32_vreducenepbf16128_mask: - case X86::BI__builtin_ia32_vreducenepbf16256_mask: - case X86::BI__builtin_ia32_vreducenepbf16512_mask: + case X86::BI__builtin_ia32_vreducebf16128_mask: + case X86::BI__builtin_ia32_vreducebf16256_mask: + case X86::BI__builtin_ia32_vreducebf16512_mask: case X86::BI__builtin_ia32_vreducepd256_round_mask: case X86::BI__builtin_ia32_vreduceps256_round_mask: case X86::BI__builtin_ia32_vreduceph256_round_mask: @@ -973,9 +973,9 @@ bool SemaX86::CheckBuiltinFunctionCall(const TargetInfo &TI, unsigned BuiltinID, case X86::BI__builtin_ia32_fpclassph128_mask: case X86::BI__builtin_ia32_fpclassph256_mask: case X86::BI__builtin_ia32_fpclassph512_mask: - case X86::BI__builtin_ia32_vfpclasspbf16128_mask: - case X86::BI__builtin_ia32_vfpclasspbf16256_mask: - case X86::BI__builtin_ia32_vfpclasspbf16512_mask: + case X86::BI__builtin_ia32_vfpclassbf16128_mask: + case X86::BI__builtin_ia32_vfpclassbf16256_mask: + case X86::BI__builtin_ia32_vfpclassbf16512_mask: case X86::BI__builtin_ia32_fpclasssd_mask: case X86::BI__builtin_ia32_fpclassss_mask: case X86::BI__builtin_ia32_fpclasssh_mask: diff --git a/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c b/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c index b00859c174fba..78405d63984f6 100644 --- a/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c +++ b/clang/test/CodeGen/X86/avx10_2_512bf16-builtins.c @@ -146,22 
+146,22 @@ __m512bh test_mm512_setr_pbh(__bf16 bf1, __bf16 bf2, __bf16 bf3, __bf16 bf4, bf25, bf26, bf27, bf28, bf29, bf30, bf31, bf32); } -__m512 test_mm512_castpbf16_ps(__m512bh A) { - // CHECK-LABEL: test_mm512_castpbf16_ps +__m512 test_mm512_castbf16_ps(__m512bh A) { + // CHECK-LABEL: test_mm512_castbf16_ps // CHECK: bitcast <32 x bfloat> %{{.*}} to <16 x float> - return _mm512_castpbf16_ps(A); + return _mm512_castbf16_ps(A); } -__m512d test_mm512_castpbf16_pd(__m512bh A) { - // CHECK-LABEL: test_mm512_castpbf16_pd +__m512d test_mm512_castbf16_pd(__m512bh A) { + // CHECK-LABEL: test_mm512_castbf16_pd // CHECK: bitcast <32 x bfloat> %{{.*}} to <8 x double> - return _mm512_castpbf16_pd(A); + return _mm512_castbf16_pd(A); } -__m512i test_mm512_castpbf16_si512(__m512bh A) { - // CHECK-LABEL: test_mm512_castpbf16_si512 +__m512i test_mm512_castbf16_si512(__m512bh A) { + // CHECK-LABEL: test_mm512_castbf16_si512 // CHECK: bitcast <32 x bfloat> %{{.*}} to <8 x i64> - return _mm512_castpbf16_si512(A); + return _mm512_castbf16_si512(A); } __m512bh test_mm512_castps_pbh(__m512 A) { @@ -182,40 +182,40 @@ __m512bh test_mm512_castsi512_pbh(__m512i A) { return _mm512_castsi512_pbh(A); } -__m128bh test_mm512_castpbf16512_pbh128(__m512bh __a) { - // CHECK-LABEL: test_mm512_castpbf16512_pbh128 +__m128bh test_mm512_castbf16512_pbh128(__m512bh __a) { + // CHECK-LABEL: test_mm512_castbf16512_pbh128 // CHECK: shufflevector <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <8 x i32> - return _mm512_castpbf16512_pbh128(__a); + return _mm512_castbf16512_pbh128(__a); } -__m256bh test_mm512_castpbf16512_pbh256(__m512bh __a) { - // CHECK-LABEL: test_mm512_castpbf16512_pbh256 +__m256bh test_mm512_castbf16512_pbh256(__m512bh __a) { + // CHECK-LABEL: test_mm512_castbf16512_pbh256 // CHECK: shufflevector <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <16 x i32> - return _mm512_castpbf16512_pbh256(__a); + return _mm512_castbf16512_pbh256(__a); } -__m512bh test_mm512_castpbf16128_pbh512(__m128bh 
__a) { - // CHECK-LABEL: test_mm512_castpbf16128_pbh512 +__m512bh test_mm512_castbf16128_pbh512(__m128bh __a) { + // CHECK-LABEL: test_mm512_castbf16128_pbh512 // CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <32 x i32> - return _mm512_castpbf16128_pbh512(__a); + return _mm512_castbf16128_pbh512(__a); } -__m512bh test_mm512_castpbf16256_pbh512(__m256bh __a) { - // CHECK-LABEL: test_mm512_castpbf16256_pbh512 +__m512bh test_mm512_castbf16256_pbh512(__m256bh __a) { + // CHECK-LABEL: test_mm512_castbf16256_pbh512 // CHECK: shufflevector <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <32 x i32> - return _mm512_castpbf16256_pbh512(__a); + return _mm512_castbf16256_pbh512(__a); } -__m512bh test_mm512_zextpbf16128_pbh512(__m128bh __a) { - // CHECK-LABEL: test_mm512_zextpbf16128_pbh512 +__m512bh test_mm512_zextbf16128_pbh512(__m128bh __a) { + // CHECK-LABEL: test_mm512_zextbf16128_pbh512 // CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> {{.*}}, <32 x i32> - return _mm512_zextpbf16128_pbh512(__a); + return _mm512_zextbf16128_pbh512(__a); } -__m512bh test_mm512_zextpbf16256_pbh512(__m256bh __a) { - // CHECK-LABEL: test_mm512_zextpbf16256_pbh512 +__m512bh test_mm512_zextbf16256_pbh512(__m256bh __a) { + // CHECK-LABEL: test_mm512_zextbf16256_pbh512 // CHECK: shufflevector <16 x bfloat> %{{.*}}, <16 x bfloat> {{.*}}, <32 x i32> - return _mm512_zextpbf16256_pbh512(__a); + return _mm512_zextbf16256_pbh512(__a); } __m512bh test_mm512_abs_pbh(__m512bh a) { @@ -277,110 +277,110 @@ __m512bh test_mm512_permutexvar_epi16(__m512i __A, __m512bh __B) { return _mm512_permutexvar_pbh(__A, __B); } -__m512bh test_mm512_addne_pbh(__m512bh __A, __m512bh __B) { - // CHECK-LABEL: @test_mm512_addne_pbh +__m512bh test_mm512_add_pbh(__m512bh __A, __m512bh __B) { + // CHECK-LABEL: @test_mm512_add_pbh // CHECK: %{{.*}} = fadd <32 x bfloat> %{{.*}}, %{{.*}} - return _mm512_addne_pbh(__A, __B); + return _mm512_add_pbh(__A, __B); } -__m512bh test_mm512_mask_addne_pbh(__m512bh 
__W, __mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_mask_add_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK: %{{.*}} = fadd <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_addne_pbh(__W, __U, __A, __B); + return _mm512_mask_add_pbh(__W, __U, __A, __B); } -__m512bh test_mm512_maskz_addne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_maskz_add_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK: %{{.*}} = fadd <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_addne_pbh(__U, __A, __B); + return _mm512_maskz_add_pbh(__U, __A, __B); } -__m512bh test_mm512_subne_pbh(__m512bh __A, __m512bh __B) { - // CHECK-LABEL: @test_mm512_subne_pbh +__m512bh test_mm512_sub_pbh(__m512bh __A, __m512bh __B) { + // CHECK-LABEL: @test_mm512_sub_pbh // CHECK: %{{.*}} = fsub <32 x bfloat> %{{.*}}, %{{.*}} - return _mm512_subne_pbh(__A, __B); + return _mm512_sub_pbh(__A, __B); } -__m512bh test_mm512_mask_subne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_mask_sub_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK: %{{.*}} = fsub <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_subne_pbh(__W, __U, __A, __B); + return _mm512_mask_sub_pbh(__W, __U, __A, __B); } -__m512bh test_mm512_maskz_subne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_maskz_sub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK: %{{.*}} = fsub <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_subne_pbh(__U, __A, __B); + return _mm512_maskz_sub_pbh(__U, __A, __B); } -__m512bh test_mm512_mulne_pbh(__m512bh __A, __m512bh __B) { - // 
CHECK-LABEL: @test_mm512_mulne_pbh +__m512bh test_mm512_mul_pbh(__m512bh __A, __m512bh __B) { + // CHECK-LABEL: @test_mm512_mul_pbh // CHECK: %{{.*}} = fmul <32 x bfloat> %{{.*}}, %{{.*}} - return _mm512_mulne_pbh(__A, __B); + return _mm512_mul_pbh(__A, __B); } -__m512bh test_mm512_mask_mulne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_mask_mul_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK: %{{.*}} = fmul <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_mulne_pbh(__W, __U, __A, __B); + return _mm512_mask_mul_pbh(__W, __U, __A, __B); } -__m512bh test_mm512_maskz_mulne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_maskz_mul_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK: %{{.*}} = fmul <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_mulne_pbh(__U, __A, __B); + return _mm512_maskz_mul_pbh(__U, __A, __B); } -__m512bh test_mm512_divne_pbh(__m512bh __A, __m512bh __B) { - // CHECK-LABEL: @test_mm512_divne_pbh +__m512bh test_mm512_div_pbh(__m512bh __A, __m512bh __B) { + // CHECK-LABEL: @test_mm512_div_pbh // CHECK: %{{.*}} = fdiv <32 x bfloat> %{{.*}}, %{{.*}} - return _mm512_divne_pbh(__A, __B); + return _mm512_div_pbh(__A, __B); } -__m512bh test_mm512_mask_divne_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_mask_div_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK: %{{.*}} = fdiv <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_divne_pbh(__W, __U, __A, __B); + return _mm512_mask_div_pbh(__W, __U, __A, __B); } -__m512bh test_mm512_maskz_divne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { +__m512bh test_mm512_maskz_div_pbh(__mmask32 __U, __m512bh __A, __m512bh 
__B) { // CHECK: %{{.*}} = fdiv <32 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_divne_pbh(__U, __A, __B); + return _mm512_maskz_div_pbh(__U, __A, __B); } __m512bh test_mm512_max_pbh(__m512bh __A, __m512bh __B) { // CHECK-LABEL: @test_mm512_max_pbh - // CHECK: @llvm.x86.avx10.vmaxpbf16512( + // CHECK: @llvm.x86.avx10.vmaxbf16512( return _mm512_max_pbh(__A, __B); } __m512bh test_mm512_mask_max_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { - // CHECK: @llvm.x86.avx10.vmaxpbf16512 + // CHECK: @llvm.x86.avx10.vmaxbf16512 // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} return _mm512_mask_max_pbh(__W, __U, __A, __B); } __m512bh test_mm512_maskz_max_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { - // CHECK: @llvm.x86.avx10.vmaxpbf16512 + // CHECK: @llvm.x86.avx10.vmaxbf16512 // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} return _mm512_maskz_max_pbh(__U, __A, __B); } __m512bh test_mm512_min_pbh(__m512bh __A, __m512bh __B) { // CHECK-LABEL: @test_mm512_min_pbh - // CHECK: @llvm.x86.avx10.vminpbf16512( + // CHECK: @llvm.x86.avx10.vminbf16512( return _mm512_min_pbh(__A, __B); } __m512bh test_mm512_mask_min_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { - // CHECK: @llvm.x86.avx10.vminpbf16512 + // CHECK: @llvm.x86.avx10.vminbf16512 // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} return _mm512_mask_min_pbh(__W, __U, __A, __B); } __m512bh test_mm512_maskz_min_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { - // CHECK: @llvm.x86.avx10.vminpbf16512 + // CHECK: @llvm.x86.avx10.vminbf16512 // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} return _mm512_maskz_min_pbh(__U, __A, __B); } @@ -802,139 +802,139 @@ __mmask32 test_mm512_mask_cmp_pbh_mask_true_us(__mmask32 m, __m512bh a, __m512bh __mmask32 
test_mm512_mask_fpclass_pbh_mask(__mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_mask_fpclass_pbh_mask - // CHECK: @llvm.x86.avx10.fpclass.nepbf16.512 + // CHECK: @llvm.x86.avx10.fpclass.bf16.512 return _mm512_mask_fpclass_pbh_mask(__U, __A, 4); } __mmask32 test_mm512_fpclass_pbh_mask(__m512bh __A) { // CHECK-LABEL: @test_mm512_fpclass_pbh_mask - // CHECK: @llvm.x86.avx10.fpclass.nepbf16.512 + // CHECK: @llvm.x86.avx10.fpclass.bf16.512 return _mm512_fpclass_pbh_mask(__A, 4); } __m512bh test_mm512_scalef_pbh(__m512bh __A, __m512bh __B) { // CHECK-LABEL: @test_mm512_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.512 return _mm512_scalef_pbh(__A, __B); } __m512bh test_mm512_mask_scalef_pbh(__m512bh __W, __mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK-LABEL: @test_mm512_mask_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.512 return _mm512_mask_scalef_pbh(__W, __U, __A, __B); } __m512bh test_mm512_maskz_scalef_pbh(__mmask32 __U, __m512bh __A, __m512bh __B) { // CHECK-LABEL: @test_mm512_maskz_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.512 return _mm512_maskz_scalef_pbh(__U, __A, __B); } __m512bh test_mm512_rcp_pbh(__m512bh __A) { // CHECK-LABEL: @test_mm512_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.512 return _mm512_rcp_pbh(__A); } __m512bh test_mm512_mask_rcp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_mask_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.512 return (__m512bh)_mm512_mask_rcp_pbh(__W, __U, __A); } __m512bh test_mm512_maskz_rcp_pbh(__mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_maskz_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.512 return 
_mm512_maskz_rcp_pbh(__U, __A); } __m512bh test_mm512_getexp_pbh(__m512bh __A) { // CHECK-LABEL: @test_mm512_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.512 return _mm512_getexp_pbh(__A); } __m512bh test_mm512_mask_getexp_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_mask_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.512 return _mm512_mask_getexp_pbh(__W, __U, __A); } __m512bh test_mm512_maskz_getexp_pbh(__mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_maskz_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.512 return _mm512_maskz_getexp_pbh(__U, __A); } __m512bh test_mm512_rsqrt_pbh(__m512bh __A) { // CHECK-LABEL: @test_mm512_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.512 return _mm512_rsqrt_pbh(__A); } __m512bh test_mm512_mask_rsqrt_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_mask_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.512 return (__m512bh)_mm512_mask_rsqrt_pbh(__W, __U, __A); } __m512bh test_mm512_maskz_rsqrt_pbh(__mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_maskz_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.512 return _mm512_maskz_rsqrt_pbh(__U, __A); } -__m512bh test_mm512_reducene_pbh(__m512bh __A) { - // CHECK-LABEL: @test_mm512_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.512 - return _mm512_reducene_pbh(__A, 3); +__m512bh test_mm512_reduce_pbh(__m512bh __A) { + // CHECK-LABEL: @test_mm512_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.512 + return _mm512_reduce_pbh(__A, 3); } -__m512bh test_mm512_mask_reducene_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) { - // CHECK-LABEL: 
@test_mm512_mask_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.512 - return _mm512_mask_reducene_pbh(__W, __U, __A, 1); +__m512bh test_mm512_mask_reduce_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) { + // CHECK-LABEL: @test_mm512_mask_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.512 + return _mm512_mask_reduce_pbh(__W, __U, __A, 1); } -__m512bh test_mm512_maskz_reducene_pbh(__mmask16 __U, __m512bh __A) { - // CHECK-LABEL: @test_mm512_maskz_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.512 - return _mm512_maskz_reducene_pbh(__U, __A, 1); +__m512bh test_mm512_maskz_reduce_pbh(__mmask16 __U, __m512bh __A) { + // CHECK-LABEL: @test_mm512_maskz_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.512 + return _mm512_maskz_reduce_pbh(__U, __A, 1); } -__m512bh test_mm512_roundscalene_pbh(__m512bh __A) { - // CHECK-LABEL: @test_mm512_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.512 - return _mm512_roundscalene_pbh(__A, 3); +__m512bh test_mm512_roundscale_pbh(__m512bh __A) { + // CHECK-LABEL: @test_mm512_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.512 + return _mm512_roundscale_pbh(__A, 3); } -__m512bh test_mm512_mask_roundscalene_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) { - // CHECK-LABEL: @test_mm512_mask_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.512 - return _mm512_mask_roundscalene_pbh(__W, __U, __A, 1); +__m512bh test_mm512_mask_roundscale_pbh(__m512bh __W, __mmask16 __U, __m512bh __A) { + // CHECK-LABEL: @test_mm512_mask_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.512 + return _mm512_mask_roundscale_pbh(__W, __U, __A, 1); } -__m512bh test_mm512_maskz_roundscalene_pbh(__mmask16 __U, __m512bh __A) { - // CHECK-LABEL: @test_mm512_maskz_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.512 - return _mm512_maskz_roundscalene_pbh(__U, __A, 1 ); +__m512bh test_mm512_maskz_roundscale_pbh(__mmask16 __U, __m512bh __A) { + // 
CHECK-LABEL: @test_mm512_maskz_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.512 + return _mm512_maskz_roundscale_pbh(__U, __A, 1 ); } __m512bh test_mm512_getmant_pbh(__m512bh __A) { // CHECK-LABEL: @test_mm512_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.512 return _mm512_getmant_pbh(__A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } __m512bh test_mm512_mask_getmant_pbh(__m512bh __W, __mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_mask_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.512 return _mm512_mask_getmant_pbh(__W, __U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } __m512bh test_mm512_maskz_getmant_pbh(__mmask32 __U, __m512bh __A) { // CHECK-LABEL: @test_mm512_maskz_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.512 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.512 return _mm512_maskz_getmant_pbh(__U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } @@ -960,126 +960,126 @@ __m512bh test_mm512_maskz_sqrt_pbh(__mmask32 __U, __m512bh __A) { return _mm512_maskz_sqrt_pbh(__U, __A); } -__m512bh test_mm512_fmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_fmaddne_pbh +__m512bh test_mm512_fmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_fmadd_pbh // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) - return _mm512_fmaddne_pbh(__A, __B, __C); + return _mm512_fmadd_pbh(__A, __B, __C); } -__m512bh test_mm512_mask_fmaddne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_mask_fmaddne_pbh +__m512bh test_mm512_mask_fmadd_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_mask_fmadd_pbh // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> 
%{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_fmaddne_pbh(__A, __U, __B, __C); + return _mm512_mask_fmadd_pbh(__A, __U, __B, __C); } -__m512bh test_mm512_mask3_fmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { - // CHECK-LABEL: @test_mm512_mask3_fmaddne_pbh +__m512bh test_mm512_mask3_fmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { + // CHECK-LABEL: @test_mm512_mask3_fmadd_pbh // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask3_fmaddne_pbh(__A, __B, __C, __U); + return _mm512_mask3_fmadd_pbh(__A, __B, __C, __U); } -__m512bh test_mm512_maskz_fmaddne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_maskz_fmaddne_pbh +__m512bh test_mm512_maskz_fmadd_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_maskz_fmadd_pbh // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_fmaddne_pbh(__U, __A, __B, __C); + return _mm512_maskz_fmadd_pbh(__U, __A, __B, __C); } -__m512bh test_mm512_fmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_fmsubne_pbh +__m512bh test_mm512_fmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_fmsub_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) - return _mm512_fmsubne_pbh(__A, __B, __C); + return _mm512_fmsub_pbh(__A, __B, __C); } -__m512bh test_mm512_mask_fmsubne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_mask_fmsubne_pbh +__m512bh 
test_mm512_mask_fmsub_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_mask_fmsub_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_fmsubne_pbh(__A, __U, __B, __C); + return _mm512_mask_fmsub_pbh(__A, __U, __B, __C); } -__m512bh test_mm512_mask3_fmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { - // CHECK-LABEL: @test_mm512_mask3_fmsubne_pbh +__m512bh test_mm512_mask3_fmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { + // CHECK-LABEL: @test_mm512_mask3_fmsub_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask3_fmsubne_pbh(__A, __B, __C, __U); + return _mm512_mask3_fmsub_pbh(__A, __B, __C, __U); } -__m512bh test_mm512_maskz_fmsubne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_maskz_fmsubne_pbh +__m512bh test_mm512_maskz_fmsub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_maskz_fmsub_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_fmsubne_pbh(__U, __A, __B, __C); + return _mm512_maskz_fmsub_pbh(__U, __A, __B, __C); } -__m512bh test_mm512_fnmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_fnmaddne_pbh +__m512bh test_mm512_fnmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_fnmadd_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x 
bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) - return _mm512_fnmaddne_pbh(__A, __B, __C); + return _mm512_fnmadd_pbh(__A, __B, __C); } -__m512bh test_mm512_mask_fnmaddne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_mask_fnmaddne_pbh +__m512bh test_mm512_mask_fnmadd_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_mask_fnmadd_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_fnmaddne_pbh(__A, __U, __B, __C); + return _mm512_mask_fnmadd_pbh(__A, __U, __B, __C); } -__m512bh test_mm512_mask3_fnmaddne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { - // CHECK-LABEL: @test_mm512_mask3_fnmaddne_pbh +__m512bh test_mm512_mask3_fnmadd_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { + // CHECK-LABEL: @test_mm512_mask3_fnmadd_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask3_fnmaddne_pbh(__A, __B, __C, __U); + return _mm512_mask3_fnmadd_pbh(__A, __B, __C, __U); } -__m512bh test_mm512_maskz_fnmaddne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_maskz_fnmaddne_pbh +__m512bh test_mm512_maskz_fnmadd_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_maskz_fnmadd_pbh // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_fnmaddne_pbh(__U, __A, __B, __C); + return _mm512_maskz_fnmadd_pbh(__U, __A, __B, __C); } -__m512bh 
test_mm512_fnmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_fnmsubne_pbh +__m512bh test_mm512_fnmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) - return _mm512_fnmsubne_pbh(__A, __B, __C); + return _mm512_fnmsub_pbh(__A, __B, __C); } -__m512bh test_mm512_mask_fnmsubne_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_mask_fnmsubne_pbh +__m512bh test_mm512_mask_fnmsub_pbh(__m512bh __A, __mmask32 __U, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: @test_mm512_mask_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask_fnmsubne_pbh(__A, __U, __B, __C); + return _mm512_mask_fnmsub_pbh(__A, __U, __B, __C); } -__m512bh test_mm512_mask3_fnmsubne_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { - // CHECK-LABEL: @test_mm512_mask3_fnmsubne_pbh +__m512bh test_mm512_mask3_fnmsub_pbh(__m512bh __A, __m512bh __B, __m512bh __C, __mmask32 __U) { + // CHECK-LABEL: @test_mm512_mask3_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_mask3_fnmsubne_pbh(__A, __B, __C, __U); + return _mm512_mask3_fnmsub_pbh(__A, __B, __C, __U); } -__m512bh test_mm512_maskz_fnmsubne_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { - // CHECK-LABEL: @test_mm512_maskz_fnmsubne_pbh +__m512bh test_mm512_maskz_fnmsub_pbh(__mmask32 __U, __m512bh __A, __m512bh __B, __m512bh __C) { + // CHECK-LABEL: 
@test_mm512_maskz_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}}) // CHECK: select <32 x i1> %{{.*}}, <32 x bfloat> %{{.*}}, <32 x bfloat> %{{.*}} - return _mm512_maskz_fnmsubne_pbh(__U, __A, __B, __C); + return _mm512_maskz_fnmsub_pbh(__U, __A, __B, __C); } diff --git a/clang/test/CodeGen/X86/avx10_2bf16-builtins.c b/clang/test/CodeGen/X86/avx10_2bf16-builtins.c index 9935137ca8677..931381af5df75 100644 --- a/clang/test/CodeGen/X86/avx10_2bf16-builtins.c +++ b/clang/test/CodeGen/X86/avx10_2bf16-builtins.c @@ -164,28 +164,28 @@ __m256bh test_mm256_setr_pbh(__bf16 bf1, __bf16 bf2, __bf16 bf3, __bf16 bf4, bf9, bf10, bf11, bf12, bf13, bf14, bf15, bf16); } -__m128 test_mm_castpbf16_ps(__m128bh A) { - // CHECK-LABEL: test_mm_castpbf16_ps +__m128 test_mm_castbf16_ps(__m128bh A) { + // CHECK-LABEL: test_mm_castbf16_ps // CHECK: bitcast <8 x bfloat> %{{.*}} to <4 x float> - return _mm_castpbf16_ps(A); + return _mm_castbf16_ps(A); } -__m256 test_mm256_castpbf16_ps(__m256bh A) { - // CHECK-LABEL: test_mm256_castpbf16_ps +__m256 test_mm256_castbf16_ps(__m256bh A) { + // CHECK-LABEL: test_mm256_castbf16_ps // CHECK: bitcast <16 x bfloat> %{{.*}} to <8 x float> - return _mm256_castpbf16_ps(A); + return _mm256_castbf16_ps(A); } -__m128i test_mm_castpbf16_si128(__m128bh A) { - // CHECK-LABEL: test_mm_castpbf16_si128 +__m128i test_mm_castbf16_si128(__m128bh A) { + // CHECK-LABEL: test_mm_castbf16_si128 // CHECK: bitcast <8 x bfloat> %{{.*}} to <2 x i64> - return _mm_castpbf16_si128(A); + return _mm_castbf16_si128(A); } -__m256i test_mm256_castpbf16_si256(__m256bh A) { - // CHECK-LABEL: test_mm256_castpbf16_si256 +__m256i test_mm256_castbf16_si256(__m256bh A) { + // CHECK-LABEL: test_mm256_castbf16_si256 // CHECK: bitcast <16 x bfloat> %{{.*}} to <4 x i64> - return _mm256_castpbf16_si256(A); + return _mm256_castbf16_si256(A); } __m128bh test_mm_castps_pbh(__m128 A) { @@ 
-224,34 +224,34 @@ __m256bh test_mm256_castsi256_pbh(__m256i A) { return _mm256_castsi256_pbh(A); } -__m128d test_mm_castpbf16_pd(__m128bh A) { - // CHECK-LABEL: test_mm_castpbf16_pd +__m128d test_mm_castbf16_pd(__m128bh A) { + // CHECK-LABEL: test_mm_castbf16_pd // CHECK: bitcast <8 x bfloat> %{{.*}} to <2 x double> - return _mm_castpbf16_pd(A); + return _mm_castbf16_pd(A); } -__m128bh test_mm256_castpbf16256_pbh128(__m256bh __a) { - // CHECK-LABEL: test_mm256_castpbf16256_pbh128 +__m128bh test_mm256_castbf16256_pbh128(__m256bh __a) { + // CHECK-LABEL: test_mm256_castbf16256_pbh128 // CHECK: shufflevector <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <8 x i32> - return _mm256_castpbf16256_pbh128(__a); + return _mm256_castbf16256_pbh128(__a); } -__m256bh test_mm256_castpbf16128_pbh256(__m128bh __a) { - // CHECK-LABEL: test_mm256_castpbf16128_pbh256 +__m256bh test_mm256_castbf16128_pbh256(__m128bh __a) { + // CHECK-LABEL: test_mm256_castbf16128_pbh256 // CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <16 x i32> - return _mm256_castpbf16128_pbh256(__a); + return _mm256_castbf16128_pbh256(__a); } -__m256d test_mm256_castpbf16_pd(__m256bh A) { - // CHECK-LABEL: test_mm256_castpbf16_pd +__m256d test_mm256_castbf16_pd(__m256bh A) { + // CHECK-LABEL: test_mm256_castbf16_pd // CHECK: bitcast <16 x bfloat> %{{.*}} to <4 x double> - return _mm256_castpbf16_pd(A); + return _mm256_castbf16_pd(A); } -__m256bh test_mm256_zextpbf16128_pbh256(__m128bh __a) { - // CHECK-LABEL: test_mm256_zextpbf16128_pbh256 +__m256bh test_mm256_zextbf16128_pbh256(__m128bh __a) { + // CHECK-LABEL: test_mm256_zextbf16128_pbh256 // CHECK: shufflevector <8 x bfloat> %{{.*}}, <8 x bfloat> {{.*}}, <16 x i32> - return _mm256_zextpbf16128_pbh256(__a); + return _mm256_zextbf16128_pbh256(__a); } __m128bh test_mm_abs_pbh(__m128bh a) { @@ -432,218 +432,218 @@ __m256bh test_mm256_permutexvar_pbh(__m256i __A, __m256bh __B) { return _mm256_permutexvar_pbh(__A, __B); } -__m256bh 
test_mm256_addne_pbh(__m256bh __A, __m256bh __B) { - // CHECK-LABEL: @test_mm256_addne_pbh +__m256bh test_mm256_add_pbh(__m256bh __A, __m256bh __B) { + // CHECK-LABEL: @test_mm256_add_pbh // CHECK: %{{.*}} = fadd <16 x bfloat> %{{.*}}, %{{.*}} - return _mm256_addne_pbh(__A, __B); + return _mm256_add_pbh(__A, __B); } -__m256bh test_mm256_mask_addne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_mask_add_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fadd <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return (__m256bh)_mm256_mask_addne_pbh(__W, __U, __A, __B); + return (__m256bh)_mm256_mask_add_pbh(__W, __U, __A, __B); } -__m256bh test_mm256_maskz_addne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_maskz_add_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fadd <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_addne_pbh(__U, __A, __B); + return _mm256_maskz_add_pbh(__U, __A, __B); } -__m128bh test_mm_addne_pbh(__m128bh __A, __m128bh __B) { - // CHECK-LABEL: @test_mm_addne_pbh +__m128bh test_mm_add_pbh(__m128bh __A, __m128bh __B) { + // CHECK-LABEL: @test_mm_add_pbh // CHECK: %{{.*}} = fadd <8 x bfloat> %{{.*}}, %{{.*}} - return _mm_addne_pbh(__A, __B); + return _mm_add_pbh(__A, __B); } -__m128bh test_mm_mask_addne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh test_mm_mask_add_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fadd <8 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return (__m128bh)_mm_mask_addne_pbh(__W, __U, __A, __B); + return (__m128bh)_mm_mask_add_pbh(__W, __U, __A, __B); } -__m128bh test_mm_maskz_addne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh 
test_mm_maskz_add_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fadd <8 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_addne_pbh(__U, __A, __B); + return _mm_maskz_add_pbh(__U, __A, __B); } -__m256bh test_mm256_subne_pbh(__m256bh __A, __m256bh __B) { - // CHECK-LABEL: @test_mm256_subne_pbh +__m256bh test_mm256_sub_pbh(__m256bh __A, __m256bh __B) { + // CHECK-LABEL: @test_mm256_sub_pbh // CHECK: %{{.*}} = fsub <16 x bfloat> %{{.*}}, %{{.*}} - return _mm256_subne_pbh(__A, __B); + return _mm256_sub_pbh(__A, __B); } -__m256bh test_mm256_mask_subne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_mask_sub_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fsub <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return (__m256bh)_mm256_mask_subne_pbh(__W, __U, __A, __B); + return (__m256bh)_mm256_mask_sub_pbh(__W, __U, __A, __B); } -__m256bh test_mm256_maskz_subne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_maskz_sub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fsub <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_subne_pbh(__U, __A, __B); + return _mm256_maskz_sub_pbh(__U, __A, __B); } -__m128bh test_mm_subne_pbh(__m128bh __A, __m128bh __B) { - // CHECK-LABEL: @test_mm_subne_pbh +__m128bh test_mm_sub_pbh(__m128bh __A, __m128bh __B) { + // CHECK-LABEL: @test_mm_sub_pbh // CHECK: %{{.*}} = fsub <8 x bfloat> %{{.*}}, %{{.*}} - return _mm_subne_pbh(__A, __B); + return _mm_sub_pbh(__A, __B); } -__m128bh test_mm_mask_subne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh test_mm_mask_sub_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fsub <8 x bfloat> %{{.*}}, 
%{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return (__m128bh)_mm_mask_subne_pbh(__W, __U, __A, __B); + return (__m128bh)_mm_mask_sub_pbh(__W, __U, __A, __B); } -__m128bh test_mm_maskz_subne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh test_mm_maskz_sub_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fsub <8 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_subne_pbh(__U, __A, __B); + return _mm_maskz_sub_pbh(__U, __A, __B); } -__m256bh test_mm256_mulne_pbh(__m256bh __A, __m256bh __B) { - // CHECK-LABEL: @test_mm256_mulne_pbh +__m256bh test_mm256_mul_pbh(__m256bh __A, __m256bh __B) { + // CHECK-LABEL: @test_mm256_mul_pbh // CHECK: %{{.*}} = fmul <16 x bfloat> %{{.*}}, %{{.*}} - return _mm256_mulne_pbh(__A, __B); + return _mm256_mul_pbh(__A, __B); } -__m256bh test_mm256_mask_mulne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_mask_mul_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fmul <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return (__m256bh)_mm256_mask_mulne_pbh(__W, __U, __A, __B); + return (__m256bh)_mm256_mask_mul_pbh(__W, __U, __A, __B); } -__m256bh test_mm256_maskz_mulne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_maskz_mul_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fmul <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_mulne_pbh(__U, __A, __B); + return _mm256_maskz_mul_pbh(__U, __A, __B); } -__m128bh test_mm_mulne_pbh(__m128bh __A, __m128bh __B) { - // CHECK-LABEL: @test_mm_mulne_pbh +__m128bh test_mm_mul_pbh(__m128bh __A, __m128bh __B) { + // CHECK-LABEL: @test_mm_mul_pbh // CHECK: %{{.*}} = fmul <8 x bfloat> %{{.*}}, %{{.*}} - 
return _mm_mulne_pbh(__A, __B); + return _mm_mul_pbh(__A, __B); } -__m128bh test_mm_mask_mulne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh test_mm_mask_mul_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fmul <8 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return (__m128bh)_mm_mask_mulne_pbh(__W, __U, __A, __B); + return (__m128bh)_mm_mask_mul_pbh(__W, __U, __A, __B); } -__m128bh test_mm_maskz_mulne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh test_mm_maskz_mul_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fmul <8 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_mulne_pbh(__U, __A, __B); + return _mm_maskz_mul_pbh(__U, __A, __B); } -__m256bh test_mm256_divne_pbh(__m256bh __A, __m256bh __B) { - // CHECK-LABEL: @test_mm256_divne_pbh +__m256bh test_mm256_div_pbh(__m256bh __A, __m256bh __B) { + // CHECK-LABEL: @test_mm256_div_pbh // CHECK: %{{.*}} = fdiv <16 x bfloat> %{{.*}}, %{{.*}} - return _mm256_divne_pbh(__A, __B); + return _mm256_div_pbh(__A, __B); } -__m256bh test_mm256_mask_divne_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_mask_div_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fdiv <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return (__m256bh)_mm256_mask_divne_pbh(__W, __U, __A, __B); + return (__m256bh)_mm256_mask_div_pbh(__W, __U, __A, __B); } -__m256bh test_mm256_maskz_divne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { +__m256bh test_mm256_maskz_div_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK: %{{.*}} = fdiv <16 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_divne_pbh(__U, __A, 
__B); + return _mm256_maskz_div_pbh(__U, __A, __B); } -__m128bh test_mm_divne_pbh(__m128bh __A, __m128bh __B) { - // CHECK-LABEL: @test_mm_divne_pbh +__m128bh test_mm_div_pbh(__m128bh __A, __m128bh __B) { + // CHECK-LABEL: @test_mm_div_pbh // CHECK: %{{.*}} = fdiv <8 x bfloat> %{{.*}}, %{{.*}} - return _mm_divne_pbh(__A, __B); + return _mm_div_pbh(__A, __B); } -__m128bh test_mm_mask_divne_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh test_mm_mask_div_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fdiv <8 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return (__m128bh)_mm_mask_divne_pbh(__W, __U, __A, __B); + return (__m128bh)_mm_mask_div_pbh(__W, __U, __A, __B); } -__m128bh test_mm_maskz_divne_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { +__m128bh test_mm_maskz_div_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { // CHECK: %{{.*}} = fdiv <8 x bfloat> %{{.*}}, %{{.*}} // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_divne_pbh(__U, __A, __B); + return _mm_maskz_div_pbh(__U, __A, __B); } __m256bh test_mm256_max_pbh(__m256bh __A, __m256bh __B) { // CHECK-LABEL: @test_mm256_max_pbh - // CHECK: @llvm.x86.avx10.vmaxpbf16256( + // CHECK: @llvm.x86.avx10.vmaxbf16256( return _mm256_max_pbh(__A, __B); } __m256bh test_mm256_mask_max_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { - // CHECK: @llvm.x86.avx10.vmaxpbf16256 + // CHECK: @llvm.x86.avx10.vmaxbf16256 // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} return (__m256bh)_mm256_mask_max_pbh(__W, __U, __A, __B); } __m256bh test_mm256_maskz_max_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { - // CHECK: @llvm.x86.avx10.vmaxpbf16256 + // CHECK: @llvm.x86.avx10.vmaxbf16256 // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} return _mm256_maskz_max_pbh(__U, __A, __B); } __m128bh 
test_mm_max_pbh(__m128bh __A, __m128bh __B) { // CHECK-LABEL: @test_mm_max_pbh - // CHECK: @llvm.x86.avx10.vmaxpbf16128( + // CHECK: @llvm.x86.avx10.vmaxbf16128( return _mm_max_pbh(__A, __B); } __m128bh test_mm_mask_max_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { - // CHECK: @llvm.x86.avx10.vmaxpbf16128 + // CHECK: @llvm.x86.avx10.vmaxbf16128 // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} return (__m128bh)_mm_mask_max_pbh(__W, __U, __A, __B); } __m128bh test_mm_maskz_max_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { - // CHECK: @llvm.x86.avx10.vmaxpbf16128 + // CHECK: @llvm.x86.avx10.vmaxbf16128 // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} return _mm_maskz_max_pbh(__U, __A, __B); } __m256bh test_mm256_min_pbh(__m256bh __A, __m256bh __B) { // CHECK-LABEL: @test_mm256_min_pbh - // CHECK: @llvm.x86.avx10.vminpbf16256( + // CHECK: @llvm.x86.avx10.vminbf16256( return _mm256_min_pbh(__A, __B); } __m256bh test_mm256_mask_min_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { - // CHECK: @llvm.x86.avx10.vminpbf16256 + // CHECK: @llvm.x86.avx10.vminbf16256 // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} return (__m256bh)_mm256_mask_min_pbh(__W, __U, __A, __B); } __m256bh test_mm256_maskz_min_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { - // CHECK: @llvm.x86.avx10.vminpbf16256 + // CHECK: @llvm.x86.avx10.vminbf16256 // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} return _mm256_maskz_min_pbh(__U, __A, __B); } __m128bh test_mm_min_pbh(__m128bh __A, __m128bh __B) { // CHECK-LABEL: @test_mm_min_pbh - // CHECK: @llvm.x86.avx10.vminpbf16128( + // CHECK: @llvm.x86.avx10.vminbf16128( return _mm_min_pbh(__A, __B); } __m128bh test_mm_mask_min_pbh(__m128bh __W, __mmask16 __U, __m128bh __A, __m128bh __B) { - // CHECK: @llvm.x86.avx10.vminpbf16128 + // CHECK: @llvm.x86.avx10.vminbf16128 // CHECK: select <8 x i1> %{{.*}}, 
<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} return (__m128bh)_mm_mask_min_pbh(__W, __U, __A, __B); } __m128bh test_mm_maskz_min_pbh(__mmask16 __U, __m128bh __A, __m128bh __B) { - // CHECK: @llvm.x86.avx10.vminpbf16128 + // CHECK: @llvm.x86.avx10.vminbf16128 // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} return _mm_maskz_min_pbh(__U, __A, __B); } @@ -1519,151 +1519,151 @@ __mmask8 test_mm_mask_cmp_pbh_mask_true_us(__mmask8 m, __m128bh a, __m128bh b) { __mmask16 test_mm256_mask_fpclass_pbh_mask(__mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_mask_fpclass_pbh_mask - // CHECK: @llvm.x86.avx10.fpclass.nepbf16.256 + // CHECK: @llvm.x86.avx10.fpclass.bf16.256 return _mm256_mask_fpclass_pbh_mask(__U, __A, 4); } __mmask16 test_mm256_fpclass_pbh_mask(__m256bh __A) { // CHECK-LABEL: @test_mm256_fpclass_pbh_mask - // CHECK: @llvm.x86.avx10.fpclass.nepbf16.256 + // CHECK: @llvm.x86.avx10.fpclass.bf16.256 return _mm256_fpclass_pbh_mask(__A, 4); } __mmask8 test_mm_mask_fpclass_pbh_mask(__mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_mask_fpclass_pbh_mask - // CHECK: @llvm.x86.avx10.fpclass.nepbf16.128 + // CHECK: @llvm.x86.avx10.fpclass.bf16.128 return _mm_mask_fpclass_pbh_mask(__U, __A, 4); } __mmask8 test_mm_fpclass_pbh_mask(__m128bh __A) { // CHECK-LABEL: @test_mm_fpclass_pbh_mask - // CHECK: @llvm.x86.avx10.fpclass.nepbf16.128 + // CHECK: @llvm.x86.avx10.fpclass.bf16.128 return _mm_fpclass_pbh_mask(__A, 4); } __m256bh test_mm256_scalef_pbh(__m256bh __A, __m256bh __B) { // CHECK-LABEL: @test_mm256_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.256 return _mm256_scalef_pbh(__A, __B); } __m256bh test_mm256_mask_scalef_pbh(__m256bh __W, __mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK-LABEL: @test_mm256_mask_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.256 return _mm256_mask_scalef_pbh(__W, __U, __A, __B); 
} __m256bh test_mm256_maskz_scalef_pbh(__mmask16 __U, __m256bh __A, __m256bh __B) { // CHECK-LABEL: @test_mm256_maskz_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.256 return _mm256_maskz_scalef_pbh(__U, __A, __B); } __m256bh test_mm256_rcp_pbh(__m256bh __A) { // CHECK-LABEL: @test_mm256_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.256 return _mm256_rcp_pbh(__A); } __m256bh test_mm256_mask_rcp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_mask_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.256 return (__m256bh)_mm256_mask_rcp_pbh(__W, __U, __A); } __m256bh test_mm256_maskz_rcp_pbh(__mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_maskz_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.256 return _mm256_maskz_rcp_pbh(__U, __A); } __m256bh test_mm256_getexp_pbh(__m256bh __A) { // CHECK-LABEL: @test_mm256_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.256 return _mm256_getexp_pbh(__A); } __m256bh test_mm256_mask_getexp_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_mask_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.256 return _mm256_mask_getexp_pbh(__W, __U, __A); } __m256bh test_mm256_maskz_getexp_pbh(__mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_maskz_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.256 return _mm256_maskz_getexp_pbh(__U, __A); } __m256bh test_mm256_rsqrt_pbh(__m256bh __A) { // CHECK-LABEL: @test_mm256_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.256 return _mm256_rsqrt_pbh(__A); } __m256bh 
test_mm256_mask_rsqrt_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_mask_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.256 return (__m256bh)_mm256_mask_rsqrt_pbh(__W, __U, __A); } __m256bh test_mm256_maskz_rsqrt_pbh(__mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_maskz_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.256 return _mm256_maskz_rsqrt_pbh(__U, __A); } -__m256bh test_mm256_reducene_pbh(__m256bh __A) { - // CHECK-LABEL: @test_mm256_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.256 - return _mm256_reducene_pbh(__A, 3); +__m256bh test_mm256_reduce_pbh(__m256bh __A) { + // CHECK-LABEL: @test_mm256_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.256 + return _mm256_reduce_pbh(__A, 3); } -__m256bh test_mm256_mask_reducene_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { - // CHECK-LABEL: @test_mm256_mask_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.256 - return _mm256_mask_reducene_pbh(__W, __U, __A, 1); +__m256bh test_mm256_mask_reduce_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { + // CHECK-LABEL: @test_mm256_mask_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.256 + return _mm256_mask_reduce_pbh(__W, __U, __A, 1); } -__m256bh test_mm256_maskz_reducene_pbh(__mmask16 __U, __m256bh __A) { - // CHECK-LABEL: @test_mm256_maskz_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.256 - return _mm256_maskz_reducene_pbh(__U, __A, 1); +__m256bh test_mm256_maskz_reduce_pbh(__mmask16 __U, __m256bh __A) { + // CHECK-LABEL: @test_mm256_maskz_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.256 + return _mm256_maskz_reduce_pbh(__U, __A, 1); } -__m256bh test_mm256_roundscalene_pbh(__m256bh __A) { - // CHECK-LABEL: @test_mm256_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.256 - return _mm256_roundscalene_pbh(__A, 3); +__m256bh 
test_mm256_roundscale_pbh(__m256bh __A) { + // CHECK-LABEL: @test_mm256_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.256 + return _mm256_roundscale_pbh(__A, 3); } -__m256bh test_mm256_mask_roundscalene_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { - // CHECK-LABEL: @test_mm256_mask_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.256 - return _mm256_mask_roundscalene_pbh(__W, __U, __A, 1); +__m256bh test_mm256_mask_roundscale_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { + // CHECK-LABEL: @test_mm256_mask_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.256 + return _mm256_mask_roundscale_pbh(__W, __U, __A, 1); } -__m256bh test_mm256_maskz_roundscalene_pbh(__mmask16 __U, __m256bh __A) { - // CHECK-LABEL: @test_mm256_maskz_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.256 - return _mm256_maskz_roundscalene_pbh(__U, __A, 1 ); +__m256bh test_mm256_maskz_roundscale_pbh(__mmask16 __U, __m256bh __A) { + // CHECK-LABEL: @test_mm256_maskz_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.256 + return _mm256_maskz_roundscale_pbh(__U, __A, 1 ); } __m256bh test_mm256_getmant_pbh(__m256bh __A) { // CHECK-LABEL: @test_mm256_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.256 return _mm256_getmant_pbh(__A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } __m256bh test_mm256_mask_getmant_pbh(__m256bh __W, __mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_mask_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.256 return _mm256_mask_getmant_pbh(__W, __U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } __m256bh test_mm256_maskz_getmant_pbh(__mmask16 __U, __m256bh __A) { // CHECK-LABEL: @test_mm256_maskz_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.256 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.256 return _mm256_maskz_getmant_pbh(__U, __A, 
_MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } @@ -1689,127 +1689,127 @@ __m256bh test_mm256_maskz_sqrt_pbh(__mmask16 __U, __m256bh __A) { __m128bh test_mm_scalef_pbh(__m128bh __A, __m128bh __B) { // CHECK-LABEL: @test_mm_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.128 return _mm_scalef_pbh(__A, __B); } __m128bh test_mm_mask_scalef_pbh(__m128bh __W, __mmask8 __U, __m128bh __A, __m128bh __B) { // CHECK-LABEL: @test_mm_mask_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.128 return _mm_mask_scalef_pbh(__W, __U, __A, __B); } __m128bh test_mm_maskz_scalef_pbh(__mmask8 __U, __m128bh __A, __m128bh __B) { // CHECK-LABEL: @test_mm_maskz_scalef_pbh - // CHECK: @llvm.x86.avx10.mask.scalef.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.scalef.bf16.128 return _mm_maskz_scalef_pbh(__U, __A, __B); } __m128bh test_mm_rcp_pbh(__m128bh __A) { // CHECK-LABEL: @test_mm_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.128 return _mm_rcp_pbh(__A); } __m128bh test_mm_mask_rcp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_mask_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.128 return (__m128bh)_mm_mask_rcp_pbh(__W, __U, __A); } __m128bh test_mm_maskz_rcp_pbh(__mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_maskz_rcp_pbh - // CHECK: @llvm.x86.avx10.mask.rcp.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.rcp.bf16.128 return _mm_maskz_rcp_pbh(__U, __A); } __m128bh test_mm_getexp_pbh(__m128bh __A) { // CHECK-LABEL: @test_mm_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.128 return _mm_getexp_pbh(__A); } __m128bh test_mm_mask_getexp_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_mask_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.128 + // CHECK: 
@llvm.x86.avx10.mask.getexp.bf16.128 return _mm_mask_getexp_pbh(__W, __U, __A); } __m128bh test_mm_maskz_getexp_pbh(__mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_maskz_getexp_pbh - // CHECK: @llvm.x86.avx10.mask.getexp.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.getexp.bf16.128 return _mm_maskz_getexp_pbh(__U, __A); } __m128bh test_mm_rsqrt_pbh(__m128bh __A) { // CHECK-LABEL: @test_mm_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.128 return _mm_rsqrt_pbh(__A); } __m128bh test_mm_mask_rsqrt_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_mask_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.128 return (__m128bh)_mm_mask_rsqrt_pbh(__W, __U, __A); } __m128bh test_mm_maskz_rsqrt_pbh(__mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_maskz_rsqrt_pbh - // CHECK: @llvm.x86.avx10.mask.rsqrt.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.rsqrt.bf16.128 return _mm_maskz_rsqrt_pbh(__U, __A); } -__m128bh test_mm_reducene_pbh(__m128bh __A) { - // CHECK-LABEL: @test_mm_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.128 - return _mm_reducene_pbh(__A, 3); +__m128bh test_mm_reduce_pbh(__m128bh __A) { + // CHECK-LABEL: @test_mm_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.128 + return _mm_reduce_pbh(__A, 3); } -__m128bh test_mm_mask_reducene_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { - // CHECK-LABEL: @test_mm_mask_reducene_pbh - // CHECK: @llvm.x86.avx10.mask.reduce.nepbf16.128 - return _mm_mask_reducene_pbh(__W, __U, __A, 1); +__m128bh test_mm_mask_reduce_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { + // CHECK-LABEL: @test_mm_mask_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.128 + return _mm_mask_reduce_pbh(__W, __U, __A, 1); } -__m128bh test_mm_maskz_reducene_pbh(__mmask8 __U, __m128bh __A) { - // CHECK-LABEL: @test_mm_maskz_reducene_pbh - // CHECK: 
@llvm.x86.avx10.mask.reduce.nepbf16.128 - return _mm_maskz_reducene_pbh(__U, __A, 1); +__m128bh test_mm_maskz_reduce_pbh(__mmask8 __U, __m128bh __A) { + // CHECK-LABEL: @test_mm_maskz_reduce_pbh + // CHECK: @llvm.x86.avx10.mask.reduce.bf16.128 + return _mm_maskz_reduce_pbh(__U, __A, 1); } -__m128bh test_mm_roundscalene_pbh(__m128bh __A) { - // CHECK-LABEL: @test_mm_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.128 - return _mm_roundscalene_pbh(__A, 3); +__m128bh test_mm_roundscale_pbh(__m128bh __A) { + // CHECK-LABEL: @test_mm_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.128 + return _mm_roundscale_pbh(__A, 3); } -__m128bh test_mm_mask_roundscalene_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { - // CHECK-LABEL: @test_mm_mask_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.128 - return _mm_mask_roundscalene_pbh(__W, __U, __A, 1); +__m128bh test_mm_mask_roundscale_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { + // CHECK-LABEL: @test_mm_mask_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.128 + return _mm_mask_roundscale_pbh(__W, __U, __A, 1); } -__m128bh test_mm_maskz_roundscalene_pbh(__mmask8 __U, __m128bh __A) { - // CHECK-LABEL: @test_mm_maskz_roundscalene_pbh - // CHECK: @llvm.x86.avx10.mask.rndscale.nepbf16.128 - return _mm_maskz_roundscalene_pbh(__U, __A, 1 ); +__m128bh test_mm_maskz_roundscale_pbh(__mmask8 __U, __m128bh __A) { + // CHECK-LABEL: @test_mm_maskz_roundscale_pbh + // CHECK: @llvm.x86.avx10.mask.rndscale.bf16.128 + return _mm_maskz_roundscale_pbh(__U, __A, 1 ); } __m128bh test_mm_getmant_pbh(__m128bh __A) { // CHECK-LABEL: @test_mm_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.128 return _mm_getmant_pbh(__A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } __m128bh test_mm_mask_getmant_pbh(__m128bh __W, __mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_mask_getmant_pbh - // CHECK: 
@llvm.x86.avx10.mask.getmant.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.128 return _mm_mask_getmant_pbh(__W, __U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } __m128bh test_mm_maskz_getmant_pbh(__mmask8 __U, __m128bh __A) { // CHECK-LABEL: @test_mm_maskz_getmant_pbh - // CHECK: @llvm.x86.avx10.mask.getmant.nepbf16.128 + // CHECK: @llvm.x86.avx10.mask.getmant.bf16.128 return _mm_maskz_getmant_pbh(__U, __A, _MM_MANT_NORM_p5_2, _MM_MANT_SIGN_nan); } @@ -1833,250 +1833,250 @@ __m128bh test_mm_maskz_sqrt_pbh(__mmask8 __U, __m128bh __A) { return _mm_maskz_sqrt_pbh(__U, __A); } -__m256bh test_mm256_fmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_fmaddne_pbh +__m256bh test_mm256_fmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_fmadd_pbh // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) - return _mm256_fmaddne_pbh(__A, __B, __C); + return _mm256_fmadd_pbh(__A, __B, __C); } -__m256bh test_mm256_mask_fmaddne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_mask_fmaddne_pbh +__m256bh test_mm256_mask_fmadd_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_mask_fmadd_pbh // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask_fmaddne_pbh(__A, __U, __B, __C); + return _mm256_mask_fmadd_pbh(__A, __U, __B, __C); } -__m256bh test_mm256_mask3_fmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { - // CHECK-LABEL: @test_mm256_mask3_fmaddne_pbh +__m256bh test_mm256_mask3_fmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { + // CHECK-LABEL: @test_mm256_mask3_fmadd_pbh // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> 
%{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask3_fmaddne_pbh(__A, __B, __C, __U); + return _mm256_mask3_fmadd_pbh(__A, __B, __C, __U); } -__m256bh test_mm256_maskz_fmaddne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_maskz_fmaddne_pbh +__m256bh test_mm256_maskz_fmadd_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_maskz_fmadd_pbh // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_fmaddne_pbh(__U, __A, __B, __C); + return _mm256_maskz_fmadd_pbh(__U, __A, __B, __C); } -__m256bh test_mm256_fmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_fmsubne_pbh +__m256bh test_mm256_fmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_fmsub_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) - return _mm256_fmsubne_pbh(__A, __B, __C); + return _mm256_fmsub_pbh(__A, __B, __C); } -__m256bh test_mm256_mask_fmsubne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_mask_fmsubne_pbh +__m256bh test_mm256_mask_fmsub_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_mask_fmsub_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask_fmsubne_pbh(__A, __U, __B, __C); + return _mm256_mask_fmsub_pbh(__A, __U, __B, __C); } -__m256bh test_mm256_mask3_fmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { - // CHECK-LABEL: 
@test_mm256_mask3_fmsubne_pbh +__m256bh test_mm256_mask3_fmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { + // CHECK-LABEL: @test_mm256_mask3_fmsub_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask3_fmsubne_pbh(__A, __B, __C, __U); + return _mm256_mask3_fmsub_pbh(__A, __B, __C, __U); } -__m256bh test_mm256_maskz_fmsubne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_maskz_fmsubne_pbh +__m256bh test_mm256_maskz_fmsub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_maskz_fmsub_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_fmsubne_pbh(__U, __A, __B, __C); + return _mm256_maskz_fmsub_pbh(__U, __A, __B, __C); } -__m256bh test_mm256_fnmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_fnmaddne_pbh +__m256bh test_mm256_fnmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_fnmadd_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) - return _mm256_fnmaddne_pbh(__A, __B, __C); + return _mm256_fnmadd_pbh(__A, __B, __C); } -__m256bh test_mm256_mask_fnmaddne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_mask_fnmaddne_pbh +__m256bh test_mm256_mask_fnmadd_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_mask_fnmadd_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select 
<16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask_fnmaddne_pbh(__A, __U, __B, __C); + return _mm256_mask_fnmadd_pbh(__A, __U, __B, __C); } -__m256bh test_mm256_mask3_fnmaddne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { - // CHECK-LABEL: @test_mm256_mask3_fnmaddne_pbh +__m256bh test_mm256_mask3_fnmadd_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { + // CHECK-LABEL: @test_mm256_mask3_fnmadd_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask3_fnmaddne_pbh(__A, __B, __C, __U); + return _mm256_mask3_fnmadd_pbh(__A, __B, __C, __U); } -__m256bh test_mm256_maskz_fnmaddne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_maskz_fnmaddne_pbh +__m256bh test_mm256_maskz_fnmadd_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_maskz_fnmadd_pbh // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_fnmaddne_pbh(__U, __A, __B, __C); + return _mm256_maskz_fnmadd_pbh(__U, __A, __B, __C); } -__m256bh test_mm256_fnmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_fnmsubne_pbh +__m256bh test_mm256_fnmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) - return _mm256_fnmsubne_pbh(__A, __B, __C); + return _mm256_fnmsub_pbh(__A, __B, __C); } -__m256bh test_mm256_mask_fnmsubne_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: 
@test_mm256_mask_fnmsubne_pbh +__m256bh test_mm256_mask_fnmsub_pbh(__m256bh __A, __mmask16 __U, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_mask_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask_fnmsubne_pbh(__A, __U, __B, __C); + return _mm256_mask_fnmsub_pbh(__A, __U, __B, __C); } -__m256bh test_mm256_mask3_fnmsubne_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { - // CHECK-LABEL: @test_mm256_mask3_fnmsubne_pbh +__m256bh test_mm256_mask3_fnmsub_pbh(__m256bh __A, __m256bh __B, __m256bh __C, __mmask16 __U) { + // CHECK-LABEL: @test_mm256_mask3_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_mask3_fnmsubne_pbh(__A, __B, __C, __U); + return _mm256_mask3_fnmsub_pbh(__A, __B, __C, __U); } -__m256bh test_mm256_maskz_fnmsubne_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { - // CHECK-LABEL: @test_mm256_maskz_fnmsubne_pbh +__m256bh test_mm256_maskz_fnmsub_pbh(__mmask16 __U, __m256bh __A, __m256bh __B, __m256bh __C) { + // CHECK-LABEL: @test_mm256_maskz_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}}) // CHECK: select <16 x i1> %{{.*}}, <16 x bfloat> %{{.*}}, <16 x bfloat> %{{.*}} - return _mm256_maskz_fnmsubne_pbh(__U, __A, __B, __C); + return _mm256_maskz_fnmsub_pbh(__U, __A, __B, __C); } -__m128bh test_mm_fmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_fmaddne_pbh +__m128bh test_mm_fmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_fmadd_pbh // 
CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) - return _mm_fmaddne_pbh(__A, __B, __C); + return _mm_fmadd_pbh(__A, __B, __C); } -__m128bh test_mm_mask_fmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_mask_fmaddne_pbh +__m128bh test_mm_mask_fmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_mask_fmadd_pbh // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask_fmaddne_pbh(__A, __U, __B, __C); + return _mm_mask_fmadd_pbh(__A, __U, __B, __C); } -__m128bh test_mm_mask3_fmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { - // CHECK-LABEL: @test_mm_mask3_fmaddne_pbh +__m128bh test_mm_mask3_fmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { + // CHECK-LABEL: @test_mm_mask3_fmadd_pbh // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask3_fmaddne_pbh(__A, __B, __C, __U); + return _mm_mask3_fmadd_pbh(__A, __B, __C, __U); } -__m128bh test_mm_maskz_fmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_maskz_fmaddne_pbh +__m128bh test_mm_maskz_fmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_maskz_fmadd_pbh // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_fmaddne_pbh(__U, __A, __B, __C); + return _mm_maskz_fmadd_pbh(__U, __A, __B, __C); } -__m128bh test_mm_fmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_fmsubne_pbh 
+__m128bh test_mm_fmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_fmsub_pbh // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) - return _mm_fmsubne_pbh(__A, __B, __C); + return _mm_fmsub_pbh(__A, __B, __C); } -__m128bh test_mm_mask_fmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_mask_fmsubne_pbh +__m128bh test_mm_mask_fmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_mask_fmsub_pbh // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask_fmsubne_pbh(__A, __U, __B, __C); + return _mm_mask_fmsub_pbh(__A, __U, __B, __C); } -__m128bh test_mm_mask3_fmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { - // CHECK-LABEL: @test_mm_mask3_fmsubne_pbh +__m128bh test_mm_mask3_fmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { + // CHECK-LABEL: @test_mm_mask3_fmsub_pbh // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask3_fmsubne_pbh(__A, __B, __C, __U); + return _mm_mask3_fmsub_pbh(__A, __B, __C, __U); } -__m128bh test_mm_maskz_fmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_maskz_fmsubne_pbh +__m128bh test_mm_maskz_fmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_maskz_fmsub_pbh // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_fmsubne_pbh(__U, __A, __B, 
__C); + return _mm_maskz_fmsub_pbh(__U, __A, __B, __C); } -__m128bh test_mm_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_fnmaddne_pbh +__m128bh test_mm_fnmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_fnmadd_pbh // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) - return _mm_fnmaddne_pbh(__A, __B, __C); + return _mm_fnmadd_pbh(__A, __B, __C); } -__m128bh test_mm_mask_fnmaddne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_mask_fnmaddne_pbh +__m128bh test_mm_mask_fnmadd_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_mask_fnmadd_pbh // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask_fnmaddne_pbh(__A, __U, __B, __C); + return _mm_mask_fnmadd_pbh(__A, __U, __B, __C); } -__m128bh test_mm_mask3_fnmaddne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { - // CHECK-LABEL: @test_mm_mask3_fnmaddne_pbh +__m128bh test_mm_mask3_fnmadd_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { + // CHECK-LABEL: @test_mm_mask3_fnmadd_pbh // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask3_fnmaddne_pbh(__A, __B, __C, __U); + return _mm_mask3_fnmadd_pbh(__A, __B, __C, __U); } -__m128bh test_mm_maskz_fnmaddne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_maskz_fnmaddne_pbh +__m128bh test_mm_maskz_fnmadd_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_maskz_fnmadd_pbh // CHECK: fneg // CHECK: call <8 x bfloat> 
@llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_fnmaddne_pbh(__U, __A, __B, __C); + return _mm_maskz_fnmadd_pbh(__U, __A, __B, __C); } -__m128bh test_mm_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_fnmsubne_pbh +__m128bh test_mm_fnmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) - return _mm_fnmsubne_pbh(__A, __B, __C); + return _mm_fnmsub_pbh(__A, __B, __C); } -__m128bh test_mm_mask_fnmsubne_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { - // CHECK-LABEL: @test_mm_mask_fnmsubne_pbh +__m128bh test_mm_mask_fnmsub_pbh(__m128bh __A, __mmask8 __U, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_mask_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask_fnmsubne_pbh(__A, __U, __B, __C); + return _mm_mask_fnmsub_pbh(__A, __U, __B, __C); } -__m128bh test_mm_mask3_fnmsubne_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { - // CHECK-LABEL: @test_mm_mask3_fnmsubne_pbh +__m128bh test_mm_mask3_fnmsub_pbh(__m128bh __A, __m128bh __B, __m128bh __C, __mmask8 __U) { + // CHECK-LABEL: @test_mm_mask3_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_mask3_fnmsubne_pbh(__A, __B, __C, __U); + return _mm_mask3_fnmsub_pbh(__A, __B, __C, __U); } -__m128bh test_mm_maskz_fnmsubne_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, 
__m128bh __C) { - // CHECK-LABEL: @test_mm_maskz_fnmsubne_pbh +__m128bh test_mm_maskz_fnmsub_pbh(__mmask8 __U, __m128bh __A, __m128bh __B, __m128bh __C) { + // CHECK-LABEL: @test_mm_maskz_fnmsub_pbh // CHECK: fneg // CHECK: fneg // CHECK: call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}}) // CHECK: select <8 x i1> %{{.*}}, <8 x bfloat> %{{.*}}, <8 x bfloat> %{{.*}} - return _mm_maskz_fnmsubne_pbh(__U, __A, __B, __C); + return _mm_maskz_fnmsub_pbh(__U, __A, __B, __C); } diff --git a/llvm/include/llvm/IR/IntrinsicsX86.td b/llvm/include/llvm/IR/IntrinsicsX86.td index 42b211e0e1f75..a258da8b7e49f 100644 --- a/llvm/include/llvm/IR/IntrinsicsX86.td +++ b/llvm/include/llvm/IR/IntrinsicsX86.td @@ -7588,58 +7588,58 @@ def int_x86_avx10_mask_vcvtneph2hf8s512 : ClangBuiltin<"__builtin_ia32_vcvtneph2 //===----------------------------------------------------------------------===// let TargetPrefix = "x86" in { -def int_x86_avx10_vaddnepbf16512 : ClangBuiltin<"__builtin_ia32_vaddnepbf16512">, +def int_x86_avx10_vaddbf16512 : ClangBuiltin<"__builtin_ia32_vaddbf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vaddnepbf16256 : ClangBuiltin<"__builtin_ia32_vaddnepbf16256">, +def int_x86_avx10_vaddbf16256 : ClangBuiltin<"__builtin_ia32_vaddbf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vaddnepbf16128 : ClangBuiltin<"__builtin_ia32_vaddnepbf16128">, +def int_x86_avx10_vaddbf16128 : ClangBuiltin<"__builtin_ia32_vaddbf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vsubnepbf16512 : ClangBuiltin<"__builtin_ia32_vsubnepbf16512">, +def int_x86_avx10_vsubbf16512 : ClangBuiltin<"__builtin_ia32_vsubbf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vsubnepbf16256 : 
ClangBuiltin<"__builtin_ia32_vsubnepbf16256">, +def int_x86_avx10_vsubbf16256 : ClangBuiltin<"__builtin_ia32_vsubbf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vsubnepbf16128 : ClangBuiltin<"__builtin_ia32_vsubnepbf16128">, +def int_x86_avx10_vsubbf16128 : ClangBuiltin<"__builtin_ia32_vsubbf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vmulnepbf16512 : ClangBuiltin<"__builtin_ia32_vmulnepbf16512">, +def int_x86_avx10_vmulbf16512 : ClangBuiltin<"__builtin_ia32_vmulbf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vmulnepbf16256 : ClangBuiltin<"__builtin_ia32_vmulnepbf16256">, +def int_x86_avx10_vmulbf16256 : ClangBuiltin<"__builtin_ia32_vmulbf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vmulnepbf16128 : ClangBuiltin<"__builtin_ia32_vmulnepbf16128">, +def int_x86_avx10_vmulbf16128 : ClangBuiltin<"__builtin_ia32_vmulbf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vdivnepbf16512 : ClangBuiltin<"__builtin_ia32_vdivnepbf16512">, +def int_x86_avx10_vdivbf16512 : ClangBuiltin<"__builtin_ia32_vdivbf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vdivnepbf16256 : ClangBuiltin<"__builtin_ia32_vdivnepbf16256">, +def int_x86_avx10_vdivbf16256 : ClangBuiltin<"__builtin_ia32_vdivbf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vdivnepbf16128 : ClangBuiltin<"__builtin_ia32_vdivnepbf16128">, +def int_x86_avx10_vdivbf16128 : ClangBuiltin<"__builtin_ia32_vdivbf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vmaxpbf16512 : 
ClangBuiltin<"__builtin_ia32_vmaxpbf16512">, +def int_x86_avx10_vmaxbf16512 : ClangBuiltin<"__builtin_ia32_vmaxbf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vmaxpbf16256 : ClangBuiltin<"__builtin_ia32_vmaxpbf16256">, +def int_x86_avx10_vmaxbf16256 : ClangBuiltin<"__builtin_ia32_vmaxbf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vmaxpbf16128 : ClangBuiltin<"__builtin_ia32_vmaxpbf16128">, +def int_x86_avx10_vmaxbf16128 : ClangBuiltin<"__builtin_ia32_vmaxbf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vminpbf16512 : ClangBuiltin<"__builtin_ia32_vminpbf16512">, +def int_x86_avx10_vminbf16512 : ClangBuiltin<"__builtin_ia32_vminbf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vminpbf16256 : ClangBuiltin<"__builtin_ia32_vminpbf16256">, +def int_x86_avx10_vminbf16256 : ClangBuiltin<"__builtin_ia32_vminbf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vminpbf16128 : ClangBuiltin<"__builtin_ia32_vminpbf16128">, +def int_x86_avx10_vminbf16128 : ClangBuiltin<"__builtin_ia32_vminbf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty], [IntrNoMem]>; def int_x86_avx10_vcomsbf16eq : ClangBuiltin<"__builtin_ia32_vcomsbf16eq">, @@ -7660,181 +7660,181 @@ def int_x86_avx10_vcomsbf16ge : ClangBuiltin<"__builtin_ia32_vcomsbf16ge">, def int_x86_avx10_vcomsbf16neq : ClangBuiltin<"__builtin_ia32_vcomsbf16neq">, DefaultAttrsIntrinsic<[llvm_i32_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty], [IntrNoMem]>; -def int_x86_avx10_mask_rsqrt_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vrsqrtpbf16128_mask">, +def int_x86_avx10_mask_rsqrt_bf16_128 : ClangBuiltin<"__builtin_ia32_vrsqrtbf16128_mask">, 
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty], [IntrNoMem]>; -def int_x86_avx10_mask_rsqrt_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vrsqrtpbf16256_mask">, +def int_x86_avx10_mask_rsqrt_bf16_256 : ClangBuiltin<"__builtin_ia32_vrsqrtbf16256_mask">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty], [IntrNoMem]>; -def int_x86_avx10_mask_rsqrt_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vrsqrtpbf16512_mask">, +def int_x86_avx10_mask_rsqrt_bf16_512 : ClangBuiltin<"__builtin_ia32_vrsqrtbf16512_mask">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem]>; -def int_x86_avx10_mask_rcp_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vrcppbf16128_mask">, +def int_x86_avx10_mask_rcp_bf16_128 : ClangBuiltin<"__builtin_ia32_vrcpbf16128_mask">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty], [IntrNoMem]>; -def int_x86_avx10_mask_rcp_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vrcppbf16256_mask">, +def int_x86_avx10_mask_rcp_bf16_256 : ClangBuiltin<"__builtin_ia32_vrcpbf16256_mask">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty], [IntrNoMem]>; -def int_x86_avx10_mask_rcp_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vrcppbf16512_mask">, +def int_x86_avx10_mask_rcp_bf16_512 : ClangBuiltin<"__builtin_ia32_vrcpbf16512_mask">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem]>; -def int_x86_avx10_mask_reduce_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vreducenepbf16128_mask">, +def int_x86_avx10_mask_reduce_bf16_128 : ClangBuiltin<"__builtin_ia32_vreducebf16128_mask">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_i32_ty, llvm_v8bf16_ty, llvm_i8_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_reduce_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vreducenepbf16256_mask">, +def int_x86_avx10_mask_reduce_bf16_256 : 
ClangBuiltin<"__builtin_ia32_vreducebf16256_mask">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_i32_ty, llvm_v16bf16_ty, llvm_i16_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_reduce_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vreducenepbf16512_mask">, +def int_x86_avx10_mask_reduce_bf16_512 : ClangBuiltin<"__builtin_ia32_vreducebf16512_mask">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_i32_ty, llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_fpclass_nepbf16_128 : +def int_x86_avx10_fpclass_bf16_128 : DefaultAttrsIntrinsic<[llvm_v8i1_ty], [llvm_v8bf16_ty, llvm_i32_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_fpclass_nepbf16_256 : +def int_x86_avx10_fpclass_bf16_256 : DefaultAttrsIntrinsic<[llvm_v16i1_ty], [llvm_v16bf16_ty, llvm_i32_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_fpclass_nepbf16_512 : +def int_x86_avx10_fpclass_bf16_512 : DefaultAttrsIntrinsic<[llvm_v32i1_ty], [llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_getexp_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vgetexppbf16128_mask">, +def int_x86_avx10_mask_getexp_bf16_128 : ClangBuiltin<"__builtin_ia32_vgetexpbf16128_mask">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty], [IntrNoMem]>; -def int_x86_avx10_mask_getexp_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vgetexppbf16256_mask">, +def int_x86_avx10_mask_getexp_bf16_256 : ClangBuiltin<"__builtin_ia32_vgetexpbf16256_mask">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty], [IntrNoMem]>; -def int_x86_avx10_mask_getexp_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vgetexppbf16512_mask">, +def int_x86_avx10_mask_getexp_bf16_512 : ClangBuiltin<"__builtin_ia32_vgetexpbf16512_mask">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem]>; -def int_x86_avx10_mask_getmant_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vgetmantpbf16128_mask">, 
+def int_x86_avx10_mask_getmant_bf16_128 : ClangBuiltin<"__builtin_ia32_vgetmantbf16128_mask">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_i32_ty, llvm_v8bf16_ty, llvm_i8_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_getmant_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vgetmantpbf16256_mask">, +def int_x86_avx10_mask_getmant_bf16_256 : ClangBuiltin<"__builtin_ia32_vgetmantbf16256_mask">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_i32_ty, llvm_v16bf16_ty, llvm_i16_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_getmant_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vgetmantpbf16512_mask">, +def int_x86_avx10_mask_getmant_bf16_512 : ClangBuiltin<"__builtin_ia32_vgetmantbf16512_mask">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_i32_ty, llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_rndscale_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vrndscalenepbf16_128_mask">, +def int_x86_avx10_mask_rndscale_bf16_128 : ClangBuiltin<"__builtin_ia32_vrndscalebf16_128_mask">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_i32_ty, llvm_v8bf16_ty, llvm_i8_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_rndscale_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vrndscalenepbf16_256_mask">, +def int_x86_avx10_mask_rndscale_bf16_256 : ClangBuiltin<"__builtin_ia32_vrndscalebf16_256_mask">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_i32_ty, llvm_v16bf16_ty, llvm_i16_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_rndscale_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vrndscalenepbf16_mask">, +def int_x86_avx10_mask_rndscale_bf16_512 : ClangBuiltin<"__builtin_ia32_vrndscalebf16_mask">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_i32_ty, llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem, ImmArg>]>; -def int_x86_avx10_mask_scalef_nepbf16_128 : ClangBuiltin<"__builtin_ia32_vscalefpbf16128_mask">, +def int_x86_avx10_mask_scalef_bf16_128 : 
ClangBuiltin<"__builtin_ia32_vscalefbf16128_mask">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_i8_ty], [IntrNoMem]>; -def int_x86_avx10_mask_scalef_nepbf16_256 : ClangBuiltin<"__builtin_ia32_vscalefpbf16256_mask">, +def int_x86_avx10_mask_scalef_bf16_256 : ClangBuiltin<"__builtin_ia32_vscalefbf16256_mask">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_i16_ty], [IntrNoMem]>; -def int_x86_avx10_mask_scalef_nepbf16_512 : ClangBuiltin<"__builtin_ia32_vscalefpbf16512_mask">, +def int_x86_avx10_mask_scalef_bf16_512 : ClangBuiltin<"__builtin_ia32_vscalefbf16512_mask">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_i32_ty], [IntrNoMem]>; -def int_x86_avx10_vfmadd213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmadd213nepbf16256">, +def int_x86_avx10_vfmadd213bf16256 : ClangBuiltin<"__builtin_ia32_vfmadd213bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmadd213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmadd213nepbf16128">, +def int_x86_avx10_vfmadd213bf16128 : ClangBuiltin<"__builtin_ia32_vfmadd213bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfmadd132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmadd132nepbf16512">, +def int_x86_avx10_vfmadd132bf16512 : ClangBuiltin<"__builtin_ia32_vfmadd132bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmadd132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmadd132nepbf16256">, +def int_x86_avx10_vfmadd132bf16256 : ClangBuiltin<"__builtin_ia32_vfmadd132bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmadd132nepbf16128 : 
ClangBuiltin<"__builtin_ia32_vfmadd132nepbf16128">, +def int_x86_avx10_vfmadd132bf16128 : ClangBuiltin<"__builtin_ia32_vfmadd132bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfmadd231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmadd231nepbf16512">, +def int_x86_avx10_vfmadd231bf16512 : ClangBuiltin<"__builtin_ia32_vfmadd231bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmadd231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmadd231nepbf16256">, +def int_x86_avx10_vfmadd231bf16256 : ClangBuiltin<"__builtin_ia32_vfmadd231bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmadd231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmadd231nepbf16128">, +def int_x86_avx10_vfmadd231bf16128 : ClangBuiltin<"__builtin_ia32_vfmadd231bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfmsub213nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmsub213nepbf16512">, +def int_x86_avx10_vfmsub213bf16512 : ClangBuiltin<"__builtin_ia32_vfmsub213bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmsub213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmsub213nepbf16256">, +def int_x86_avx10_vfmsub213bf16256 : ClangBuiltin<"__builtin_ia32_vfmsub213bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmsub213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmsub213nepbf16128">, +def int_x86_avx10_vfmsub213bf16128 : ClangBuiltin<"__builtin_ia32_vfmsub213bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def 
int_x86_avx10_vfmsub132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmsub132nepbf16512">, +def int_x86_avx10_vfmsub132bf16512 : ClangBuiltin<"__builtin_ia32_vfmsub132bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmsub132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmsub132nepbf16256">, +def int_x86_avx10_vfmsub132bf16256 : ClangBuiltin<"__builtin_ia32_vfmsub132bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmsub132nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmsub132nepbf16128">, +def int_x86_avx10_vfmsub132bf16128 : ClangBuiltin<"__builtin_ia32_vfmsub132bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfmsub231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfmsub231nepbf16512">, +def int_x86_avx10_vfmsub231bf16512 : ClangBuiltin<"__builtin_ia32_vfmsub231bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmsub231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfmsub231nepbf16256">, +def int_x86_avx10_vfmsub231bf16256 : ClangBuiltin<"__builtin_ia32_vfmsub231bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfmsub231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfmsub231nepbf16128">, +def int_x86_avx10_vfmsub231bf16128 : ClangBuiltin<"__builtin_ia32_vfmsub231bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfnmadd213nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd213nepbf16512">, +def int_x86_avx10_vfnmadd213bf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd213bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], 
[IntrNoMem]>; -def int_x86_avx10_vfnmadd213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd213nepbf16256">, +def int_x86_avx10_vfnmadd213bf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd213bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmadd213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd213nepbf16128">, +def int_x86_avx10_vfnmadd213bf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd213bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfnmadd132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd132nepbf16512">, +def int_x86_avx10_vfnmadd132bf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd132bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmadd132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd132nepbf16256">, +def int_x86_avx10_vfnmadd132bf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd132bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmadd132nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd132nepbf16128">, +def int_x86_avx10_vfnmadd132bf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd132bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfnmadd231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd231nepbf16512">, +def int_x86_avx10_vfnmadd231bf16512 : ClangBuiltin<"__builtin_ia32_vfnmadd231bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmadd231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd231nepbf16256">, +def int_x86_avx10_vfnmadd231bf16256 : ClangBuiltin<"__builtin_ia32_vfnmadd231bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], 
[llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmadd231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd231nepbf16128">, +def int_x86_avx10_vfnmadd231bf16128 : ClangBuiltin<"__builtin_ia32_vfnmadd231bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfnmsub213nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub213nepbf16512">, +def int_x86_avx10_vfnmsub213bf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub213bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmsub213nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub213nepbf16256">, +def int_x86_avx10_vfnmsub213bf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub213bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmsub213nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub213nepbf16128">, +def int_x86_avx10_vfnmsub213bf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub213bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfnmsub132nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub132nepbf16512">, +def int_x86_avx10_vfnmsub132bf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub132bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmsub132nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub132nepbf16256">, +def int_x86_avx10_vfnmsub132bf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub132bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmsub132nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub132nepbf16128">, +def int_x86_avx10_vfnmsub132bf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub132bf16128">, 
DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; -def int_x86_avx10_vfnmsub231nepbf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub231nepbf16512">, +def int_x86_avx10_vfnmsub231bf16512 : ClangBuiltin<"__builtin_ia32_vfnmsub231bf16512">, DefaultAttrsIntrinsic<[llvm_v32bf16_ty], [llvm_v32bf16_ty, llvm_v32bf16_ty, llvm_v32bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmsub231nepbf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub231nepbf16256">, +def int_x86_avx10_vfnmsub231bf16256 : ClangBuiltin<"__builtin_ia32_vfnmsub231bf16256">, DefaultAttrsIntrinsic<[llvm_v16bf16_ty], [llvm_v16bf16_ty, llvm_v16bf16_ty, llvm_v16bf16_ty], [IntrNoMem]>; -def int_x86_avx10_vfnmsub231nepbf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub231nepbf16128">, +def int_x86_avx10_vfnmsub231bf16128 : ClangBuiltin<"__builtin_ia32_vfnmsub231bf16128">, DefaultAttrsIntrinsic<[llvm_v8bf16_ty], [llvm_v8bf16_ty, llvm_v8bf16_ty, llvm_v8bf16_ty ], [IntrNoMem]>; } @@ -7893,4 +7893,4 @@ def int_x86_movrsdi : ClangBuiltin<"__builtin_ia32_movrsdi">, [IntrReadMem]>; def int_x86_prefetchrs : ClangBuiltin<"__builtin_ia32_prefetchrs">, Intrinsic<[], [llvm_ptr_ty], []>; -} \ No newline at end of file +} diff --git a/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp b/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp index 41a646621c7ea..a6285a55f4155 100644 --- a/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp +++ b/llvm/lib/Target/X86/AsmParser/X86AsmParser.cpp @@ -3306,11 +3306,11 @@ bool X86AsmParser::parseInstruction(ParseInstructionInfo &Info, StringRef Name, if ((PatchedName.starts_with("cmp") || PatchedName.starts_with("vcmp")) && (PatchedName.ends_with("ss") || PatchedName.ends_with("sd") || PatchedName.ends_with("sh") || PatchedName.ends_with("ph") || - PatchedName.ends_with("pbf16") || PatchedName.ends_with("ps") || + PatchedName.ends_with("bf16") || PatchedName.ends_with("ps") || PatchedName.ends_with("pd"))) { bool IsVCMP = PatchedName[0] == 'v'; unsigned CCIdx = 
IsVCMP ? 4 : 3; - unsigned suffixLength = PatchedName.ends_with("pbf16") ? 5 : 2; + unsigned suffixLength = PatchedName.ends_with("bf16") ? 4 /* strlen("bf16") */ : 2; unsigned CC = StringSwitch( PatchedName.slice(CCIdx, PatchedName.size() - suffixLength)) .Case("eq", 0x00) @@ -3375,8 +3375,8 @@ bool X86AsmParser::parseInstruction(ParseInstructionInfo &Info, StringRef Name, PatchedName = "vcmpsh"; else if (PatchedName.ends_with("ph")) PatchedName = "vcmpph"; - else if (PatchedName.ends_with("pbf16")) - PatchedName = "vcmppbf16"; + else if (PatchedName.ends_with("bf16")) + PatchedName = "vcmpbf16"; else llvm_unreachable("Unexpected suffix!"); diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp index abe0cc6365dd4..cd89b88f46194 100644 --- a/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp +++ b/llvm/lib/Target/X86/MCTargetDesc/X86ATTInstPrinter.cpp @@ -166,15 +166,15 @@ bool X86ATTInstPrinter::printVecCompareInstr(const MCInst *MI, case X86::VCMPPHZrmbi: case X86::VCMPPHZrmbik: case X86::VCMPPHZrrib: case X86::VCMPPHZrribk: case X86::VCMPSHZrrib_Int: case X86::VCMPSHZrribk_Int: - case X86::VCMPPBF16Z128rmi: case X86::VCMPPBF16Z128rri: - case X86::VCMPPBF16Z256rmi: case X86::VCMPPBF16Z256rri: - case X86::VCMPPBF16Zrmi: case X86::VCMPPBF16Zrri: - case X86::VCMPPBF16Z128rmik: case X86::VCMPPBF16Z128rrik: - case X86::VCMPPBF16Z256rmik: case X86::VCMPPBF16Z256rrik: - case X86::VCMPPBF16Zrmik: case X86::VCMPPBF16Zrrik: - case X86::VCMPPBF16Z128rmbi: case X86::VCMPPBF16Z128rmbik: - case X86::VCMPPBF16Z256rmbi: case X86::VCMPPBF16Z256rmbik: - case X86::VCMPPBF16Zrmbi: case X86::VCMPPBF16Zrmbik: + case X86::VCMPBF16Z128rmi: case X86::VCMPBF16Z128rri: + case X86::VCMPBF16Z256rmi: case X86::VCMPBF16Z256rri: + case X86::VCMPBF16Zrmi: case X86::VCMPBF16Zrri: + case X86::VCMPBF16Z128rmik: case X86::VCMPBF16Z128rrik: + case X86::VCMPBF16Z256rmik: case X86::VCMPBF16Z256rrik: + case X86::VCMPBF16Zrmik: case
X86::VCMPBF16Zrrik: + case X86::VCMPBF16Z128rmbi: case X86::VCMPBF16Z128rmbik: + case X86::VCMPBF16Z256rmbi: case X86::VCMPBF16Z256rmbik: + case X86::VCMPBF16Zrmbi: case X86::VCMPBF16Zrmbik: if (Imm >= 0 && Imm <= 31) { OS << '\t'; printCMPMnemonic(MI, /*IsVCMP*/true, OS); diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp index 681d0dab37d09..4c26fc86f9547 100644 --- a/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp +++ b/llvm/lib/Target/X86/MCTargetDesc/X86InstComments.cpp @@ -979,7 +979,7 @@ static bool printFPCLASSComments(const MCInst *MI, raw_ostream &OS, unsigned NumOperands = MI->getNumOperands(); int SrcIdx; switch (MI->getOpcode()) { - CASE_FPCLASS_PACKED(FPCLASSPBF16, r) + CASE_FPCLASS_PACKED(FPCLASSBF16, r) CASE_FPCLASS_PACKED(FPCLASSPH, r) CASE_FPCLASS_PACKED(FPCLASSPS, r) CASE_FPCLASS_PACKED(FPCLASSPD, r) @@ -989,7 +989,7 @@ static bool printFPCLASSComments(const MCInst *MI, raw_ostream &OS, SrcIdx = NumOperands - 2; break; } - CASE_FPCLASS_PACKED_MEM(FPCLASSPBF16) + CASE_FPCLASS_PACKED_MEM(FPCLASSBF16) CASE_FPCLASS_PACKED_MEM(FPCLASSPH) CASE_FPCLASS_PACKED_MEM(FPCLASSPS) CASE_FPCLASS_PACKED_MEM(FPCLASSPD) diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp index 01e2d4ace9773..8470d26011cd8 100644 --- a/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp +++ b/llvm/lib/Target/X86/MCTargetDesc/X86InstPrinterCommon.cpp @@ -309,16 +309,16 @@ void X86InstPrinterCommon::printCMPMnemonic(const MCInst *MI, bool IsVCmp, case X86::VCMPSHZrmik_Int: case X86::VCMPSHZrrik_Int: OS << "sh\t"; break; - case X86::VCMPPBF16Z128rmi: case X86::VCMPPBF16Z128rri: - case X86::VCMPPBF16Z256rmi: case X86::VCMPPBF16Z256rri: - case X86::VCMPPBF16Zrmi: case X86::VCMPPBF16Zrri: - case X86::VCMPPBF16Z128rmik: case X86::VCMPPBF16Z128rrik: - case X86::VCMPPBF16Z256rmik: case X86::VCMPPBF16Z256rrik: - case 
X86::VCMPPBF16Zrmik: case X86::VCMPPBF16Zrrik: - case X86::VCMPPBF16Z128rmbi: case X86::VCMPPBF16Z128rmbik: - case X86::VCMPPBF16Z256rmbi: case X86::VCMPPBF16Z256rmbik: - case X86::VCMPPBF16Zrmbi: case X86::VCMPPBF16Zrmbik: - OS << "pbf16\t"; + case X86::VCMPBF16Z128rmi: case X86::VCMPBF16Z128rri: + case X86::VCMPBF16Z256rmi: case X86::VCMPBF16Z256rri: + case X86::VCMPBF16Zrmi: case X86::VCMPBF16Zrri: + case X86::VCMPBF16Z128rmik: case X86::VCMPBF16Z128rrik: + case X86::VCMPBF16Z256rmik: case X86::VCMPBF16Z256rrik: + case X86::VCMPBF16Zrmik: case X86::VCMPBF16Zrrik: + case X86::VCMPBF16Z128rmbi: case X86::VCMPBF16Z128rmbik: + case X86::VCMPBF16Z256rmbi: case X86::VCMPBF16Z256rmbik: + case X86::VCMPBF16Zrmbi: case X86::VCMPBF16Zrmbik: + OS << "bf16\t"; break; } } diff --git a/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp b/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp index c26dc2ca5a7a4..0d92609b3a63d 100644 --- a/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp +++ b/llvm/lib/Target/X86/MCTargetDesc/X86IntelInstPrinter.cpp @@ -145,15 +145,15 @@ bool X86IntelInstPrinter::printVecCompareInstr(const MCInst *MI, raw_ostream &OS case X86::VCMPPHZrmbi: case X86::VCMPPHZrmbik: case X86::VCMPPHZrrib: case X86::VCMPPHZrribk: case X86::VCMPSHZrrib_Int: case X86::VCMPSHZrribk_Int: - case X86::VCMPPBF16Z128rmi: case X86::VCMPPBF16Z128rri: - case X86::VCMPPBF16Z256rmi: case X86::VCMPPBF16Z256rri: - case X86::VCMPPBF16Zrmi: case X86::VCMPPBF16Zrri: - case X86::VCMPPBF16Z128rmik: case X86::VCMPPBF16Z128rrik: - case X86::VCMPPBF16Z256rmik: case X86::VCMPPBF16Z256rrik: - case X86::VCMPPBF16Zrmik: case X86::VCMPPBF16Zrrik: - case X86::VCMPPBF16Z128rmbi: case X86::VCMPPBF16Z128rmbik: - case X86::VCMPPBF16Z256rmbi: case X86::VCMPPBF16Z256rmbik: - case X86::VCMPPBF16Zrmbi: case X86::VCMPPBF16Zrmbik: + case X86::VCMPBF16Z128rmi: case X86::VCMPBF16Z128rri: + case X86::VCMPBF16Z256rmi: case X86::VCMPBF16Z256rri: + case X86::VCMPBF16Zrmi: case 
X86::VCMPBF16Zrri: + case X86::VCMPBF16Z128rmik: case X86::VCMPBF16Z128rrik: + case X86::VCMPBF16Z256rmik: case X86::VCMPBF16Z256rrik: + case X86::VCMPBF16Zrmik: case X86::VCMPBF16Zrrik: + case X86::VCMPBF16Z128rmbi: case X86::VCMPBF16Z128rmbik: + case X86::VCMPBF16Z256rmbi: case X86::VCMPBF16Z256rmbik: + case X86::VCMPBF16Zrmbi: case X86::VCMPBF16Zrmbik: if (Imm >= 0 && Imm <= 31) { OS << '\t'; printCMPMnemonic(MI, /*IsVCMP*/true, OS); diff --git a/llvm/lib/Target/X86/X86InstrAVX10.td b/llvm/lib/Target/X86/X86InstrAVX10.td index edbcb17297603..6cc814f6b31f4 100644 --- a/llvm/lib/Target/X86/X86InstrAVX10.td +++ b/llvm/lib/Target/X86/X86InstrAVX10.td @@ -1308,31 +1308,31 @@ defm VCVTHF82PH : avx10_convert_2op_nomb<"vcvthf82ph", avx512vl_f16_info, // AVX10 BF16 instructions //------------------------------------------------- -// VADDNEPBF16, VSUBNEPBF16, VMULNEPBF16, VDIVNEPBF16, VMAXPBF16, VMINPBF16 -multiclass avx10_fp_binopne_int_pbf16 opc, string OpcodeStr, +// VADDBF16, VSUBBF16, VMULBF16, VDIVBF16, VMAXBF16, VMINBF16 +multiclass avx10_fp_binopne_int_bf16 opc, string OpcodeStr, X86SchedWriteSizes sched, bit IsCommutable = 0> { let Predicates = [HasAVX10_2_512] in defm Z : avx512_fp_packed("int_x86_avx10_"#OpcodeStr#"pbf16512"), - !cast("int_x86_avx10_"#OpcodeStr#"pbf16512"), + !cast("int_x86_avx10_"#OpcodeStr#"bf16512"), + !cast("int_x86_avx10_"#OpcodeStr#"bf16512"), v32bf16_info, sched.PH.ZMM, IsCommutable>, EVEX_V512, T_MAP5, PD, EVEX_CD8<16, CD8VF>; let Predicates = [HasAVX10_2] in { defm Z128 : avx512_fp_packed("int_x86_avx10_"#OpcodeStr#"pbf16128"), - !cast("int_x86_avx10_"#OpcodeStr#"pbf16128"), + !cast("int_x86_avx10_"#OpcodeStr#"bf16128"), + !cast("int_x86_avx10_"#OpcodeStr#"bf16128"), v8bf16x_info, sched.PH.XMM, IsCommutable>, EVEX_V128, T_MAP5, PD, EVEX_CD8<16, CD8VF>; defm Z256 : avx512_fp_packed("int_x86_avx10_"#OpcodeStr#"pbf16256"), - !cast("int_x86_avx10_"#OpcodeStr#"pbf16256"), + !cast("int_x86_avx10_"#OpcodeStr#"bf16256"), + 
!cast("int_x86_avx10_"#OpcodeStr#"bf16256"), v16bf16x_info, sched.PH.YMM, IsCommutable>, EVEX_V256, T_MAP5, PD, EVEX_CD8<16, CD8VF>; } } -multiclass avx10_fp_binop_pbf16 opc, string OpcodeStr, SDPatternOperator OpNode, +multiclass avx10_fp_binop_bf16 opc, string OpcodeStr, SDPatternOperator OpNode, X86SchedWriteSizes sched, bit IsCommutable = 0, SDPatternOperator MaskOpNode = OpNode> { @@ -1351,12 +1351,12 @@ multiclass avx10_fp_binop_pbf16 opc, string OpcodeStr, SDPatternOperator } let Uses = [], mayRaiseFPException = 0 in { -defm VADDNEPBF16 : avx10_fp_binop_pbf16<0x58, "vaddne", fadd, SchedWriteFAddSizes, 1>; -defm VSUBNEPBF16 : avx10_fp_binop_pbf16<0x5C, "vsubne", fsub, SchedWriteFAddSizes, 0>; -defm VMULNEPBF16 : avx10_fp_binop_pbf16<0x59, "vmulne", fmul, SchedWriteFMulSizes, 1>; -defm VDIVNEPBF16 : avx10_fp_binop_pbf16<0x5E, "vdivne", fdiv, SchedWriteFDivSizes, 0>; -defm VMINPBF16 : avx10_fp_binopne_int_pbf16<0x5D, "vmin", SchedWriteFCmpSizes, 0>; -defm VMAXPBF16 : avx10_fp_binopne_int_pbf16<0x5F, "vmax", SchedWriteFCmpSizes, 0>; +defm VADDBF16 : avx10_fp_binop_bf16<0x58, "vadd", fadd, SchedWriteFAddSizes, 1>; +defm VSUBBF16 : avx10_fp_binop_bf16<0x5C, "vsub", fsub, SchedWriteFAddSizes, 0>; +defm VMULBF16 : avx10_fp_binop_bf16<0x59, "vmul", fmul, SchedWriteFMulSizes, 1>; +defm VDIVBF16 : avx10_fp_binop_bf16<0x5E, "vdiv", fdiv, SchedWriteFDivSizes, 0>; +defm VMINBF16 : avx10_fp_binopne_int_bf16<0x5D, "vmin", SchedWriteFCmpSizes, 0>; +defm VMAXBF16 : avx10_fp_binopne_int_bf16<0x5F, "vmax", SchedWriteFCmpSizes, 0>; } // VCOMSBF16 @@ -1375,7 +1375,7 @@ let Uses = [], mayRaiseFPException = 0, } } -// VCMPPBF16 +// VCMPBF16 multiclass avx10_vcmp_common_bf16 { let mayRaiseFPException = 0 in { defm rri : AVX512_maskable_cmp<0xC2, MRMSrcReg, _, @@ -1421,56 +1421,56 @@ multiclass avx10_vcmp_bf16 { } } -defm VCMPPBF16 : avx10_vcmp_bf16, +defm VCMPBF16 : avx10_vcmp_bf16, AVX512XDIi8Base, EVEX, VVVV, EVEX_CD8<16, CD8VF>, TA; -// VSQRTNEPBF16 +// VSQRTBF16 multiclass 
avx10_sqrt_packed_bf16 opc, string OpcodeStr, X86SchedWriteSizes sched> { let Predicates = [HasAVX10_2_512] in - defm Z : avx512_sqrt_packed, EVEX_V512, PD, T_MAP5, EVEX_CD8<16, CD8VF>; let Predicates = [HasAVX10_2] in { - defm Z128 : avx512_sqrt_packed, EVEX_V128, PD, T_MAP5, EVEX_CD8<16, CD8VF>; - defm Z256 : avx512_sqrt_packed, EVEX_V256, PD, T_MAP5, EVEX_CD8<16, CD8VF>; } } let Uses = [], mayRaiseFPException = 0 in -defm VSQRTNEPBF16 : avx10_sqrt_packed_bf16<0x51, "vsqrtne", SchedWriteFSqrtSizes>; +defm VSQRTBF16 : avx10_sqrt_packed_bf16<0x51, "vsqrt", SchedWriteFSqrtSizes>; -// VRSQRTPBF16, VRCPPBF16, VSRQTPBF16, VGETEXPPBF16 -multiclass avx10_fp14_pbf16 opc, string OpcodeStr, SDNode OpNode, +// VRSQRTBF16, VRCPBF16, VSQRTBF16, VGETEXPBF16 +multiclass avx10_fp14_bf16 opc, string OpcodeStr, SDNode OpNode, X86SchedWriteWidths sched> { let Predicates = [HasAVX10_2_512] in - defm PBF16Z : avx512_fp14_p, - EVEX_V512; + defm BF16Z : avx512_fp14_p, + EVEX_V512; let Predicates = [HasAVX10_2] in { - defm PBF16Z128 : avx512_fp14_p, - EVEX_V128; - defm PBF16Z256 : avx512_fp14_p, - EVEX_V256; + defm BF16Z128 : avx512_fp14_p, + EVEX_V128; + defm BF16Z256 : avx512_fp14_p, + EVEX_V256; } } -defm VRSQRT : avx10_fp14_pbf16<0x4E, "vrsqrt", X86rsqrt14, SchedWriteFRsqrt>, +defm VRSQRT : avx10_fp14_bf16<0x4E, "vrsqrt", X86rsqrt14, SchedWriteFRsqrt>, T_MAP6, PS, EVEX_CD8<16, CD8VF>; -defm VRCP : avx10_fp14_pbf16<0x4C, "vrcp", X86rcp14, SchedWriteFRcp>, +defm VRCP : avx10_fp14_bf16<0x4C, "vrcp", X86rcp14, SchedWriteFRcp>, T_MAP6, PS, EVEX_CD8<16, CD8VF>; -defm VGETEXP : avx10_fp14_pbf16<0x42, "vgetexp", X86fgetexp, SchedWriteFRnd>, +defm VGETEXP : avx10_fp14_bf16<0x42, "vgetexp", X86fgetexp, SchedWriteFRnd>, T_MAP5, EVEX_CD8<16, CD8VF>; -// VSCALEFPBF16 +// VSCALEFBF16 multiclass avx10_fp_scalef_bf16 opc, string OpcodeStr, X86SchedWriteWidths sched> { let Predicates = [HasAVX10_2_512] in @@ -1485,9 +1485,9 @@ multiclass avx10_fp_scalef_bf16 opc, string OpcodeStr, } let Uses = [],
mayRaiseFPException = 0 in -defm VSCALEFPBF16 : avx10_fp_scalef_bf16<0x2C, "vscalef", SchedWriteFAdd>; +defm VSCALEFBF16 : avx10_fp_scalef_bf16<0x2C, "vscalef", SchedWriteFAdd>; -// VREDUCENEPBF16, VRNDSCALENEPBF16, VGETMANTPBF16 +// VREDUCEBF16, VRNDSCALEBF16, VGETMANTBF16 multiclass avx10_common_unary_fp_packed_imm_bf16 opc, SDPatternOperator OpNode, SDPatternOperator MaskOpNode, X86SchedWriteWidths sched> { @@ -1503,18 +1503,18 @@ multiclass avx10_common_unary_fp_packed_imm_bf16, mayRaiseFPException = 0 in { -defm VREDUCENEPBF16 : avx10_common_unary_fp_packed_imm_bf16<"vreducene", avx512vl_bf16_info, 0x56, +defm VREDUCEBF16 : avx10_common_unary_fp_packed_imm_bf16<"vreduce", avx512vl_bf16_info, 0x56, X86VReduce, X86VReduce, SchedWriteFRnd>, AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>; -defm VRNDSCALENEPBF16 : avx10_common_unary_fp_packed_imm_bf16<"vrndscalene", avx512vl_bf16_info, 0x08, +defm VRNDSCALEBF16 : avx10_common_unary_fp_packed_imm_bf16<"vrndscale", avx512vl_bf16_info, 0x08, X86any_VRndScale, X86VRndScale, SchedWriteFRnd>, AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>; -defm VGETMANTPBF16 : avx10_common_unary_fp_packed_imm_bf16<"vgetmant", avx512vl_bf16_info, 0x26, +defm VGETMANTBF16 : avx10_common_unary_fp_packed_imm_bf16<"vgetmant", avx512vl_bf16_info, 0x26, X86VGetMant, X86VGetMant, SchedWriteFRnd>, AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>; } -// VFPCLASSPBF16 +// VFPCLASSBF16 multiclass avx10_fp_fpclass_bf16 opcVec, X86SchedWriteWidths sched> { let Predicates = [HasAVX10_2_512] in @@ -1531,13 +1531,13 @@ multiclass avx10_fp_fpclass_bf16 opcVec, } } -defm VFPCLASSPBF16 : avx10_fp_fpclass_bf16<"vfpclass", 0x66, SchedWriteFCmp>, +defm VFPCLASSBF16 : avx10_fp_fpclass_bf16<"vfpclass", 0x66, SchedWriteFCmp>, AVX512XDIi8Base, TA, EVEX, EVEX_CD8<16, CD8VF>; -// VF[,N]M[ADD,SUB][132,213,231]NEPBF16 +// VF[,N]M[ADD,SUB][132,213,231]BF16 multiclass avx10_fma3p_213_bf16 opc, string OpcodeStr, - SDPatternOperator OpNode, SDNode MaskOpNode, - 
X86SchedWriteWidths sched> { + SDPatternOperator OpNode, SDNode MaskOpNode, + X86SchedWriteWidths sched> { let Predicates = [HasAVX10_2_512] in defm Z : avx512_fma3p_213_rm, EVEX_V512, T_MAP6, PS, @@ -1553,14 +1553,14 @@ multiclass avx10_fma3p_213_bf16 opc, string OpcodeStr, } let Uses = [], mayRaiseFPException = 0 in { -defm VFMADD213NEPBF16 : avx10_fma3p_213_bf16<0xA8, "vfmadd213nepbf16", any_fma, - fma, SchedWriteFMA>; -defm VFMSUB213NEPBF16 : avx10_fma3p_213_bf16<0xAA, "vfmsub213nepbf16", X86any_Fmsub, - X86Fmsub, SchedWriteFMA>; -defm VFNMADD213NEPBF16 : avx10_fma3p_213_bf16<0xAC, "vfnmadd213nepbf16", X86any_Fnmadd, - X86Fnmadd, SchedWriteFMA>; -defm VFNMSUB213NEPBF16 : avx10_fma3p_213_bf16<0xAE, "vfnmsub213nepbf16", X86any_Fnmsub, - X86Fnmsub, SchedWriteFMA>; +defm VFMADD213BF16 : avx10_fma3p_213_bf16<0xA8, "vfmadd213bf16", any_fma, + fma, SchedWriteFMA>; +defm VFMSUB213BF16 : avx10_fma3p_213_bf16<0xAA, "vfmsub213bf16", X86any_Fmsub, + X86Fmsub, SchedWriteFMA>; +defm VFNMADD213BF16 : avx10_fma3p_213_bf16<0xAC, "vfnmadd213bf16", X86any_Fnmadd, + X86Fnmadd, SchedWriteFMA>; +defm VFNMSUB213BF16 : avx10_fma3p_213_bf16<0xAE, "vfnmsub213bf16", X86any_Fnmsub, + X86Fnmsub, SchedWriteFMA>; } multiclass avx10_fma3p_231_bf16 opc, string OpcodeStr, @@ -1581,14 +1581,14 @@ multiclass avx10_fma3p_231_bf16 opc, string OpcodeStr, } let Uses = [], mayRaiseFPException = 0 in { -defm VFMADD231NEPBF16 : avx10_fma3p_231_bf16<0xB8, "vfmadd231nepbf16", any_fma, - fma, SchedWriteFMA>; -defm VFMSUB231NEPBF16 : avx10_fma3p_231_bf16<0xBA, "vfmsub231nepbf16", X86any_Fmsub, - X86Fmsub, SchedWriteFMA>; -defm VFNMADD231NEPBF16 : avx10_fma3p_231_bf16<0xBC, "vfnmadd231nepbf16", X86any_Fnmadd, - X86Fnmadd, SchedWriteFMA>; -defm VFNMSUB231NEPBF16 : avx10_fma3p_231_bf16<0xBE, "vfnmsub231nepbf16", X86any_Fnmsub, - X86Fnmsub, SchedWriteFMA>; +defm VFMADD231BF16 : avx10_fma3p_231_bf16<0xB8, "vfmadd231bf16", any_fma, + fma, SchedWriteFMA>; +defm VFMSUB231BF16 : avx10_fma3p_231_bf16<0xBA, 
"vfmsub231bf16", X86any_Fmsub, + X86Fmsub, SchedWriteFMA>; +defm VFNMADD231BF16 : avx10_fma3p_231_bf16<0xBC, "vfnmadd231bf16", X86any_Fnmadd, + X86Fnmadd, SchedWriteFMA>; +defm VFNMSUB231BF16 : avx10_fma3p_231_bf16<0xBE, "vfnmsub231bf16", X86any_Fnmsub, + X86Fnmsub, SchedWriteFMA>; } multiclass avx10_fma3p_132_bf16 opc, string OpcodeStr, @@ -1609,14 +1609,14 @@ multiclass avx10_fma3p_132_bf16 opc, string OpcodeStr, } let Uses = [], mayRaiseFPException = 0 in { -defm VFMADD132NEPBF16 : avx10_fma3p_132_bf16<0x98, "vfmadd132nepbf16", any_fma, - fma, SchedWriteFMA>; -defm VFMSUB132NEPBF16 : avx10_fma3p_132_bf16<0x9A, "vfmsub132nepbf16", X86any_Fmsub, +defm VFMADD132BF16 : avx10_fma3p_132_bf16<0x98, "vfmadd132bf16", any_fma, + fma, SchedWriteFMA>; +defm VFMSUB132BF16 : avx10_fma3p_132_bf16<0x9A, "vfmsub132bf16", X86any_Fmsub, X86Fmsub, SchedWriteFMA>; -defm VFNMADD132NEPBF16 : avx10_fma3p_132_bf16<0x9C, "vfnmadd132nepbf16", X86any_Fnmadd, - X86Fnmadd, SchedWriteFMA>; -defm VFNMSUB132NEPBF16 : avx10_fma3p_132_bf16<0x9E, "vfnmsub132nepbf16", X86any_Fnmsub, - X86Fnmsub, SchedWriteFMA>; +defm VFNMADD132BF16 : avx10_fma3p_132_bf16<0x9C, "vfnmadd132bf16", X86any_Fnmadd, + X86Fnmadd, SchedWriteFMA>; +defm VFNMSUB132BF16 : avx10_fma3p_132_bf16<0x9E, "vfnmsub132bf16", X86any_Fnmsub, + X86Fnmsub, SchedWriteFMA>; } //------------------------------------------------- diff --git a/llvm/lib/Target/X86/X86InstrFMA3Info.cpp b/llvm/lib/Target/X86/X86InstrFMA3Info.cpp index 0da4857d66748..d0c508d9934c3 100644 --- a/llvm/lib/Target/X86/X86InstrFMA3Info.cpp +++ b/llvm/lib/Target/X86/X86InstrFMA3Info.cpp @@ -53,7 +53,7 @@ using namespace llvm; FMA3GROUP_PACKED_WIDTHS_ALL(Name, PS, Attrs) #define FMA3GROUP_PACKED_BF16(Name, Attrs) \ - FMA3GROUP_PACKED_WIDTHS_Z(Name, NEPBF16, Attrs) + FMA3GROUP_PACKED_WIDTHS_Z(Name, BF16, Attrs) #define FMA3GROUP_SCALAR_WIDTHS_Z(Name, Suf, Attrs) \ FMA3GROUP(Name, Suf##Zm, Attrs) \ @@ -93,7 +93,7 @@ static const X86InstrFMA3Group Groups[] = { 
FMA3GROUP_MASKED(Name, Type##Z##Suf, Attrs) #define FMA3GROUP_PACKED_AVX512_ALL(Name, Suf, Attrs) \ - FMA3GROUP_PACKED_AVX512_WIDTHS(Name, NEPBF16, Suf, Attrs) \ + FMA3GROUP_PACKED_AVX512_WIDTHS(Name, BF16, Suf, Attrs) \ FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PD, Suf, Attrs) \ FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PH, Suf, Attrs) \ FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PS, Suf, Attrs) diff --git a/llvm/lib/Target/X86/X86InstrUtils.td b/llvm/lib/Target/X86/X86InstrUtils.td index ab171ac79fb37..6aae90b77fbad 100644 --- a/llvm/lib/Target/X86/X86InstrUtils.td +++ b/llvm/lib/Target/X86/X86InstrUtils.td @@ -311,7 +311,7 @@ def v32i16_info : X86VectorVTInfo<32, i16, VR512, "w">; def v16i32_info : X86VectorVTInfo<16, i32, VR512, "d">; def v8i64_info : X86VectorVTInfo<8, i64, VR512, "q">; def v32f16_info : X86VectorVTInfo<32, f16, VR512, "ph">; -def v32bf16_info: X86VectorVTInfo<32, bf16, VR512, "pbf16">; +def v32bf16_info: X86VectorVTInfo<32, bf16, VR512, "bf16">; def v16f32_info : X86VectorVTInfo<16, f32, VR512, "ps">; def v8f64_info : X86VectorVTInfo<8, f64, VR512, "pd">; @@ -321,7 +321,7 @@ def v16i16x_info : X86VectorVTInfo<16, i16, VR256X, "w">; def v8i32x_info : X86VectorVTInfo<8, i32, VR256X, "d">; def v4i64x_info : X86VectorVTInfo<4, i64, VR256X, "q">; def v16f16x_info : X86VectorVTInfo<16, f16, VR256X, "ph">; -def v16bf16x_info: X86VectorVTInfo<16, bf16, VR256X, "pbf16">; +def v16bf16x_info: X86VectorVTInfo<16, bf16, VR256X, "bf16">; def v8f32x_info : X86VectorVTInfo<8, f32, VR256X, "ps">; def v4f64x_info : X86VectorVTInfo<4, f64, VR256X, "pd">; @@ -330,7 +330,7 @@ def v8i16x_info : X86VectorVTInfo<8, i16, VR128X, "w">; def v4i32x_info : X86VectorVTInfo<4, i32, VR128X, "d">; def v2i64x_info : X86VectorVTInfo<2, i64, VR128X, "q">; def v8f16x_info : X86VectorVTInfo<8, f16, VR128X, "ph">; -def v8bf16x_info : X86VectorVTInfo<8, bf16, VR128X, "pbf16">; +def v8bf16x_info : X86VectorVTInfo<8, bf16, VR128X, "bf16">; def v4f32x_info : X86VectorVTInfo<4, f32, VR128X, "ps">; def 
v2f64x_info : X86VectorVTInfo<2, f64, VR128X, "pd">; diff --git a/llvm/lib/Target/X86/X86IntrinsicsInfo.h b/llvm/lib/Target/X86/X86IntrinsicsInfo.h index 86fd04046d16a..91d7d8755be9b 100644 --- a/llvm/lib/Target/X86/X86IntrinsicsInfo.h +++ b/llvm/lib/Target/X86/X86IntrinsicsInfo.h @@ -389,53 +389,53 @@ static const IntrinsicData IntrinsicsWithoutChain[] = { X86_INTRINSIC_DATA(avx_vpermilvar_ps, INTR_TYPE_2OP, X86ISD::VPERMILPV, 0), X86_INTRINSIC_DATA(avx_vpermilvar_ps_256, INTR_TYPE_2OP, X86ISD::VPERMILPV, 0), - X86_INTRINSIC_DATA(avx10_fpclass_nepbf16_128, INTR_TYPE_2OP, - X86ISD::VFPCLASS, 0), - X86_INTRINSIC_DATA(avx10_fpclass_nepbf16_256, INTR_TYPE_2OP, - X86ISD::VFPCLASS, 0), - X86_INTRINSIC_DATA(avx10_fpclass_nepbf16_512, INTR_TYPE_2OP, - X86ISD::VFPCLASS, 0), - X86_INTRINSIC_DATA(avx10_mask_getexp_nepbf16_128, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_fpclass_bf16_128, INTR_TYPE_2OP, X86ISD::VFPCLASS, + 0), + X86_INTRINSIC_DATA(avx10_fpclass_bf16_256, INTR_TYPE_2OP, X86ISD::VFPCLASS, + 0), + X86_INTRINSIC_DATA(avx10_fpclass_bf16_512, INTR_TYPE_2OP, X86ISD::VFPCLASS, + 0), + X86_INTRINSIC_DATA(avx10_mask_getexp_bf16_128, INTR_TYPE_1OP_MASK, X86ISD::FGETEXP, 0), - X86_INTRINSIC_DATA(avx10_mask_getexp_nepbf16_256, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_getexp_bf16_256, INTR_TYPE_1OP_MASK, X86ISD::FGETEXP, 0), - X86_INTRINSIC_DATA(avx10_mask_getexp_nepbf16_512, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_getexp_bf16_512, INTR_TYPE_1OP_MASK, X86ISD::FGETEXP, 0), - X86_INTRINSIC_DATA(avx10_mask_getmant_nepbf16_128, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_getmant_bf16_128, INTR_TYPE_2OP_MASK, X86ISD::VGETMANT, 0), - X86_INTRINSIC_DATA(avx10_mask_getmant_nepbf16_256, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_getmant_bf16_256, INTR_TYPE_2OP_MASK, X86ISD::VGETMANT, 0), - X86_INTRINSIC_DATA(avx10_mask_getmant_nepbf16_512, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_getmant_bf16_512, INTR_TYPE_2OP_MASK, 
X86ISD::VGETMANT, 0), - X86_INTRINSIC_DATA(avx10_mask_rcp_nepbf16_128, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rcp_bf16_128, INTR_TYPE_1OP_MASK, X86ISD::RCP14, 0), - X86_INTRINSIC_DATA(avx10_mask_rcp_nepbf16_256, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rcp_bf16_256, INTR_TYPE_1OP_MASK, X86ISD::RCP14, 0), - X86_INTRINSIC_DATA(avx10_mask_rcp_nepbf16_512, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rcp_bf16_512, INTR_TYPE_1OP_MASK, X86ISD::RCP14, 0), - X86_INTRINSIC_DATA(avx10_mask_reduce_nepbf16_128, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_reduce_bf16_128, INTR_TYPE_2OP_MASK, X86ISD::VREDUCE, 0), - X86_INTRINSIC_DATA(avx10_mask_reduce_nepbf16_256, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_reduce_bf16_256, INTR_TYPE_2OP_MASK, X86ISD::VREDUCE, 0), - X86_INTRINSIC_DATA(avx10_mask_reduce_nepbf16_512, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_reduce_bf16_512, INTR_TYPE_2OP_MASK, X86ISD::VREDUCE, 0), - X86_INTRINSIC_DATA(avx10_mask_rndscale_nepbf16_128, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rndscale_bf16_128, INTR_TYPE_2OP_MASK, X86ISD::VRNDSCALE, 0), - X86_INTRINSIC_DATA(avx10_mask_rndscale_nepbf16_256, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rndscale_bf16_256, INTR_TYPE_2OP_MASK, X86ISD::VRNDSCALE, 0), - X86_INTRINSIC_DATA(avx10_mask_rndscale_nepbf16_512, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rndscale_bf16_512, INTR_TYPE_2OP_MASK, X86ISD::VRNDSCALE, 0), - X86_INTRINSIC_DATA(avx10_mask_rsqrt_nepbf16_128, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rsqrt_bf16_128, INTR_TYPE_1OP_MASK, X86ISD::RSQRT14, 0), - X86_INTRINSIC_DATA(avx10_mask_rsqrt_nepbf16_256, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rsqrt_bf16_256, INTR_TYPE_1OP_MASK, X86ISD::RSQRT14, 0), - X86_INTRINSIC_DATA(avx10_mask_rsqrt_nepbf16_512, INTR_TYPE_1OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_rsqrt_bf16_512, INTR_TYPE_1OP_MASK, X86ISD::RSQRT14, 0), - 
X86_INTRINSIC_DATA(avx10_mask_scalef_nepbf16_128, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_scalef_bf16_128, INTR_TYPE_2OP_MASK, X86ISD::SCALEF, 0), - X86_INTRINSIC_DATA(avx10_mask_scalef_nepbf16_256, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_scalef_bf16_256, INTR_TYPE_2OP_MASK, X86ISD::SCALEF, 0), - X86_INTRINSIC_DATA(avx10_mask_scalef_nepbf16_512, INTR_TYPE_2OP_MASK, + X86_INTRINSIC_DATA(avx10_mask_scalef_bf16_512, INTR_TYPE_2OP_MASK, X86ISD::SCALEF, 0), X86_INTRINSIC_DATA(avx10_mask_vcmppd256, CMP_MASK_CC, X86ISD::CMPMM, X86ISD::CMPMM_SAE), diff --git a/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll b/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll index c41e03ba637cb..ab8ac4fbd4193 100644 --- a/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll +++ b/llvm/test/CodeGen/X86/avx10.2-fma-commute.ll @@ -4,7 +4,7 @@ define <8 x bfloat> @fma_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) { ; CHECK-LABEL: fma_123_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 +; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) ret <8 x bfloat> %a @@ -13,7 +13,7 @@ define <8 x bfloat> @fma_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa define <8 x bfloat> @fma_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) { ; CHECK-LABEL: fma_213_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 +; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z) ret <8 x bfloat> %a @@ -22,7 +22,7 @@ define <8 x bfloat> @fma_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa define <8 x bfloat> @fma_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) { ; CHECK-LABEL: fma_231_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0 +; CHECK-NEXT: vfmadd231bf16 %xmm1, 
%xmm2, %xmm0 ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x) ret <8 x bfloat> %a @@ -31,7 +31,7 @@ define <8 x bfloat> @fma_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa define <8 x bfloat> @fma_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) { ; CHECK-LABEL: fma_321_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0 +; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0 ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x) ret <8 x bfloat> %a @@ -40,7 +40,7 @@ define <8 x bfloat> @fma_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa define <8 x bfloat> @fma_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) { ; CHECK-LABEL: fma_132_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 +; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y) ret <8 x bfloat> %a @@ -49,7 +49,7 @@ define <8 x bfloat> @fma_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa define <8 x bfloat> @fma_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) { ; CHECK-LABEL: fma_312_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 +; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y) ret <8 x bfloat> %a @@ -58,7 +58,7 @@ define <8 x bfloat> @fma_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloa define <8 x bfloat> @fma_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_123_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 +; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 
x bfloat> %y, <8 x bfloat> %z) @@ -68,7 +68,7 @@ define <8 x bfloat> @fma_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr % define <8 x bfloat> @fma_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_213_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 +; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z) @@ -78,7 +78,7 @@ define <8 x bfloat> @fma_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr % define <8 x bfloat> @fma_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_231_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 +; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x) @@ -88,7 +88,7 @@ define <8 x bfloat> @fma_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr % define <8 x bfloat> @fma_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_321_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 +; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x) @@ -98,7 +98,7 @@ define <8 x bfloat> @fma_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr % define <8 x bfloat> @fma_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_132_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 +; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y) @@ -108,7 +108,7 @@ define <8 x 
bfloat> @fma_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr % define <8 x bfloat> @fma_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_312_v8bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 +; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y) @@ -119,7 +119,7 @@ define <8 x bfloat> @fma_mask_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_mask_123_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) %b = bitcast i8 %mask to <8 x i1> @@ -131,7 +131,7 @@ define <8 x bfloat> @fma_mask_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_mask_213_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z) %b = bitcast i8 %mask to <8 x i1> @@ -143,7 +143,7 @@ define <8 x bfloat> @fma_mask_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_mask_231_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %xmm2, %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 %xmm2, %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x) %b = bitcast i8 %mask to <8 x i1> @@ -155,7 +155,7 @@ define <8 x bfloat> @fma_mask_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_mask_321_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %xmm1, 
%xmm2, %xmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0 {%k1} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x) %b = bitcast i8 %mask to <8 x i1> @@ -167,7 +167,7 @@ define <8 x bfloat> @fma_mask_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_mask_132_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 %xmm2, %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 %xmm2, %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y) %b = bitcast i8 %mask to <8 x i1> @@ -179,7 +179,7 @@ define <8 x bfloat> @fma_mask_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_mask_312_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 {%k1} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y) %b = bitcast i8 %mask to <8 x i1> @@ -191,7 +191,7 @@ define <8 x bfloat> @fma_maskz_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_maskz_123_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) %b = bitcast i8 %mask to <8 x i1> @@ -203,7 +203,7 @@ define <8 x bfloat> @fma_maskz_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_maskz_213_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z) %b = bitcast i8 %mask to <8 x 
i1> @@ -215,7 +215,7 @@ define <8 x bfloat> @fma_maskz_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_maskz_231_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x) %b = bitcast i8 %mask to <8 x i1> @@ -227,7 +227,7 @@ define <8 x bfloat> @fma_maskz_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_maskz_321_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 %xmm1, %xmm2, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x) %b = bitcast i8 %mask to <8 x i1> @@ -239,7 +239,7 @@ define <8 x bfloat> @fma_maskz_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_maskz_132_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y) %b = bitcast i8 %mask to <8 x i1> @@ -251,7 +251,7 @@ define <8 x bfloat> @fma_maskz_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x ; CHECK-LABEL: fma_maskz_312_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %xmm1, %xmm2, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %xmm1, %xmm2, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y) %b = bitcast i8 %mask to <8 x i1> @@ -263,7 +263,7 @@ define <8 x bfloat> @fma_mask_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_mask_load_123_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; 
CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) @@ -276,7 +276,7 @@ define <8 x bfloat> @fma_mask_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_mask_load_213_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z) @@ -289,7 +289,7 @@ define <8 x bfloat> @fma_mask_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_mask_load_231_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x) @@ -302,7 +302,7 @@ define <8 x bfloat> @fma_mask_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_mask_load_321_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x) @@ -315,7 +315,7 @@ define <8 x bfloat> @fma_mask_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_mask_load_132_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> 
%x, <8 x bfloat> %z, <8 x bfloat> %y) @@ -328,7 +328,7 @@ define <8 x bfloat> @fma_mask_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_mask_load_312_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y) @@ -341,7 +341,7 @@ define <8 x bfloat> @fma_maskz_load_123_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_maskz_load_123_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, <8 x bfloat> %z) @@ -354,7 +354,7 @@ define <8 x bfloat> @fma_maskz_load_213_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_maskz_load_213_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %x, <8 x bfloat> %z) @@ -367,7 +367,7 @@ define <8 x bfloat> @fma_maskz_load_231_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_maskz_load_231_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %y, <8 x bfloat> %z, <8 x bfloat> %x) @@ -380,7 +380,7 @@ define <8 x bfloat> @fma_maskz_load_321_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_maskz_load_321_v8bf16: ; 
CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %y, <8 x bfloat> %x) @@ -393,7 +393,7 @@ define <8 x bfloat> @fma_maskz_load_132_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_maskz_load_132_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %x, <8 x bfloat> %z, <8 x bfloat> %y) @@ -406,7 +406,7 @@ define <8 x bfloat> @fma_maskz_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, ; CHECK-LABEL: fma_maskz_load_312_v8bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %xmm1, %xmm0 {%k1} {z} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %xmm1, %xmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <8 x bfloat>, ptr %zp %a = call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %z, <8 x bfloat> %x, <8 x bfloat> %y) @@ -418,7 +418,7 @@ define <8 x bfloat> @fma_maskz_load_312_v8bf16(<8 x bfloat> %x, <8 x bfloat> %y, define <16 x bfloat> @fma_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) { ; CHECK-LABEL: fma_123_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 +; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) ret <16 x bfloat> %a @@ -427,7 +427,7 @@ define <16 x bfloat> @fma_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x define <16 x bfloat> @fma_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) { ; CHECK-LABEL: fma_213_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, 
%ymm0 +; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z) ret <16 x bfloat> %a @@ -436,7 +436,7 @@ define <16 x bfloat> @fma_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x define <16 x bfloat> @fma_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) { ; CHECK-LABEL: fma_231_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 +; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x) ret <16 x bfloat> %a @@ -445,7 +445,7 @@ define <16 x bfloat> @fma_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x define <16 x bfloat> @fma_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) { ; CHECK-LABEL: fma_321_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 +; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x) ret <16 x bfloat> %a @@ -454,7 +454,7 @@ define <16 x bfloat> @fma_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x define <16 x bfloat> @fma_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) { ; CHECK-LABEL: fma_132_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 +; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y) ret <16 x bfloat> %a @@ -463,7 +463,7 @@ define <16 x bfloat> @fma_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x define <16 x bfloat> @fma_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) { ; CHECK-LABEL: fma_312_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 +; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 ; CHECK-NEXT: retq 
%a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y) ret <16 x bfloat> %a @@ -472,7 +472,7 @@ define <16 x bfloat> @fma_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x define <16 x bfloat> @fma_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_123_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 +; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) @@ -482,7 +482,7 @@ define <16 x bfloat> @fma_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p define <16 x bfloat> @fma_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_213_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 +; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z) @@ -492,7 +492,7 @@ define <16 x bfloat> @fma_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p define <16 x bfloat> @fma_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_231_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 +; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x) @@ -502,7 +502,7 @@ define <16 x bfloat> @fma_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p define <16 x bfloat> @fma_load_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_321_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 +; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 ; CHECK-NEXT: retq %z = load <16 x bfloat>, 
ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x) @@ -512,7 +512,7 @@ define <16 x bfloat> @fma_load_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p define <16 x bfloat> @fma_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_132_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 +; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y) @@ -522,7 +522,7 @@ define <16 x bfloat> @fma_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, p define <16 x bfloat> @fma_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_312_v16bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 +; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y) @@ -533,7 +533,7 @@ define <16 x bfloat> @fma_mask_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, < ; CHECK-LABEL: fma_mask_123_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) %b = bitcast i16 %mask to <16 x i1> @@ -545,7 +545,7 @@ define <16 x bfloat> @fma_mask_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, < ; CHECK-LABEL: fma_mask_213_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z) %b = bitcast i16 %mask to <16 x i1> 
@@ -557,7 +557,7 @@ define <16 x bfloat> @fma_mask_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, < ; CHECK-LABEL: fma_mask_231_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %ymm2, %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 %ymm2, %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x) %b = bitcast i16 %mask to <16 x i1> @@ -569,7 +569,7 @@ define <16 x bfloat> @fma_mask_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, < ; CHECK-LABEL: fma_mask_321_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 {%k1} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x) %b = bitcast i16 %mask to <16 x i1> @@ -581,7 +581,7 @@ define <16 x bfloat> @fma_mask_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, < ; CHECK-LABEL: fma_mask_132_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 %ymm2, %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 %ymm2, %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y) %b = bitcast i16 %mask to <16 x i1> @@ -593,7 +593,7 @@ define <16 x bfloat> @fma_mask_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, < ; CHECK-LABEL: fma_mask_312_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 {%k1} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y) %b = bitcast i16 %mask to <16 x i1> @@ -605,7 +605,7 @@ define <16 x bfloat> @fma_maskz_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ; CHECK-LABEL: fma_maskz_123_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; 
CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) %b = bitcast i16 %mask to <16 x i1> @@ -617,7 +617,7 @@ define <16 x bfloat> @fma_maskz_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ; CHECK-LABEL: fma_maskz_213_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z) %b = bitcast i16 %mask to <16 x i1> @@ -629,7 +629,7 @@ define <16 x bfloat> @fma_maskz_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ; CHECK-LABEL: fma_maskz_231_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x) %b = bitcast i16 %mask to <16 x i1> @@ -641,7 +641,7 @@ define <16 x bfloat> @fma_maskz_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ; CHECK-LABEL: fma_maskz_321_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 %ymm1, %ymm2, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x) %b = bitcast i16 %mask to <16 x i1> @@ -653,7 +653,7 @@ define <16 x bfloat> @fma_maskz_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ; CHECK-LABEL: fma_maskz_132_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <16 x bfloat> 
@llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y) %b = bitcast i16 %mask to <16 x i1> @@ -665,7 +665,7 @@ define <16 x bfloat> @fma_maskz_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, ; CHECK-LABEL: fma_maskz_312_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %ymm1, %ymm2, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %ymm1, %ymm2, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y) %b = bitcast i16 %mask to <16 x i1> @@ -677,7 +677,7 @@ define <16 x bfloat> @fma_mask_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_mask_load_123_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) @@ -690,7 +690,7 @@ define <16 x bfloat> @fma_mask_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_mask_load_213_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z) @@ -703,7 +703,7 @@ define <16 x bfloat> @fma_mask_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_mask_load_231_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x) @@ -716,7 +716,7 @@ define <16 x bfloat> @fma_mask_load_321_v16bf16(<16 x 
bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_mask_load_321_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x) @@ -729,7 +729,7 @@ define <16 x bfloat> @fma_mask_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_mask_load_132_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y) @@ -742,7 +742,7 @@ define <16 x bfloat> @fma_mask_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_mask_load_312_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y) @@ -755,7 +755,7 @@ define <16 x bfloat> @fma_maskz_load_123_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_maskz_load_123_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %y, <16 x bfloat> %z) @@ -768,7 +768,7 @@ define <16 x bfloat> @fma_maskz_load_213_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_maskz_load_213_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %ymm1, %ymm0 {%k1} 
{z} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %x, <16 x bfloat> %z) @@ -781,7 +781,7 @@ define <16 x bfloat> @fma_maskz_load_231_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_maskz_load_231_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %y, <16 x bfloat> %z, <16 x bfloat> %x) @@ -794,7 +794,7 @@ define <16 x bfloat> @fma_maskz_load_321_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_maskz_load_321_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %y, <16 x bfloat> %x) @@ -807,7 +807,7 @@ define <16 x bfloat> @fma_maskz_load_132_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_maskz_load_132_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %x, <16 x bfloat> %z, <16 x bfloat> %y) @@ -820,7 +820,7 @@ define <16 x bfloat> @fma_maskz_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> ; CHECK-LABEL: fma_maskz_load_312_v16bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %ymm1, %ymm0 {%k1} {z} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %ymm1, %ymm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <16 x bfloat>, ptr %zp %a = call <16 x bfloat> 
@llvm.fma.v16bf16(<16 x bfloat> %z, <16 x bfloat> %x, <16 x bfloat> %y) @@ -832,7 +832,7 @@ define <16 x bfloat> @fma_maskz_load_312_v16bf16(<16 x bfloat> %x, <16 x bfloat> define <32 x bfloat> @fma_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) { ; CHECK-LABEL: fma_123_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 +; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) ret <32 x bfloat> %a @@ -841,7 +841,7 @@ define <32 x bfloat> @fma_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x define <32 x bfloat> @fma_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) { ; CHECK-LABEL: fma_213_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 +; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z) ret <32 x bfloat> %a @@ -850,7 +850,7 @@ define <32 x bfloat> @fma_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x define <32 x bfloat> @fma_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) { ; CHECK-LABEL: fma_231_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 +; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x) ret <32 x bfloat> %a @@ -859,7 +859,7 @@ define <32 x bfloat> @fma_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x define <32 x bfloat> @fma_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) { ; CHECK-LABEL: fma_321_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 +; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x) ret <32 x bfloat> %a @@ 
-868,7 +868,7 @@ define <32 x bfloat> @fma_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x define <32 x bfloat> @fma_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) { ; CHECK-LABEL: fma_132_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 +; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y) ret <32 x bfloat> %a @@ -877,7 +877,7 @@ define <32 x bfloat> @fma_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x define <32 x bfloat> @fma_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) { ; CHECK-LABEL: fma_312_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 +; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y) ret <32 x bfloat> %a @@ -886,7 +886,7 @@ define <32 x bfloat> @fma_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x define <32 x bfloat> @fma_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_123_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 +; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) @@ -896,7 +896,7 @@ define <32 x bfloat> @fma_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p define <32 x bfloat> @fma_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_213_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 +; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z) @@ -906,7 +906,7 @@ define <32 x bfloat> 
@fma_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p define <32 x bfloat> @fma_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_231_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 +; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x) @@ -916,7 +916,7 @@ define <32 x bfloat> @fma_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p define <32 x bfloat> @fma_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_321_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 +; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x) @@ -926,7 +926,7 @@ define <32 x bfloat> @fma_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p define <32 x bfloat> @fma_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_132_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 +; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y) @@ -936,7 +936,7 @@ define <32 x bfloat> @fma_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, p define <32 x bfloat> @fma_load_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ptr %zp) { ; CHECK-LABEL: fma_load_312_v32bf16: ; CHECK: # %bb.0: -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 +; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y) @@ -947,7 +947,7 @@ define <32 x bfloat> 
@fma_mask_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, < ; CHECK-LABEL: fma_mask_123_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) %b = bitcast i32 %mask to <32 x i1> @@ -959,7 +959,7 @@ define <32 x bfloat> @fma_mask_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, < ; CHECK-LABEL: fma_mask_213_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z) %b = bitcast i32 %mask to <32 x i1> @@ -971,7 +971,7 @@ define <32 x bfloat> @fma_mask_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, < ; CHECK-LABEL: fma_mask_231_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %zmm2, %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 %zmm2, %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x) %b = bitcast i32 %mask to <32 x i1> @@ -983,7 +983,7 @@ define <32 x bfloat> @fma_mask_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, < ; CHECK-LABEL: fma_mask_321_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 {%k1} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x) %b = bitcast i32 %mask to <32 x i1> @@ -995,7 +995,7 @@ define <32 x bfloat> @fma_mask_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, < ; CHECK-LABEL: fma_mask_132_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 %zmm2, %zmm1, %zmm0 
{%k1} +; CHECK-NEXT: vfmadd132bf16 %zmm2, %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y) %b = bitcast i32 %mask to <32 x i1> @@ -1007,7 +1007,7 @@ define <32 x bfloat> @fma_mask_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, < ; CHECK-LABEL: fma_mask_312_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 {%k1} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y) %b = bitcast i32 %mask to <32 x i1> @@ -1019,7 +1019,7 @@ define <32 x bfloat> @fma_maskz_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ; CHECK-LABEL: fma_maskz_123_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) %b = bitcast i32 %mask to <32 x i1> @@ -1031,7 +1031,7 @@ define <32 x bfloat> @fma_maskz_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ; CHECK-LABEL: fma_maskz_213_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z) %b = bitcast i32 %mask to <32 x i1> @@ -1043,7 +1043,7 @@ define <32 x bfloat> @fma_maskz_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ; CHECK-LABEL: fma_maskz_231_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x 
bfloat> %x) %b = bitcast i32 %mask to <32 x i1> @@ -1055,7 +1055,7 @@ define <32 x bfloat> @fma_maskz_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ; CHECK-LABEL: fma_maskz_321_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 %zmm1, %zmm2, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x) %b = bitcast i32 %mask to <32 x i1> @@ -1067,7 +1067,7 @@ define <32 x bfloat> @fma_maskz_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ; CHECK-LABEL: fma_maskz_132_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y) %b = bitcast i32 %mask to <32 x i1> @@ -1079,7 +1079,7 @@ define <32 x bfloat> @fma_maskz_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, ; CHECK-LABEL: fma_maskz_312_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %edi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 %zmm1, %zmm2, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 %zmm1, %zmm2, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y) %b = bitcast i32 %mask to <32 x i1> @@ -1091,7 +1091,7 @@ define <32 x bfloat> @fma_mask_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_mask_load_123_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) @@ -1104,7 +1104,7 @@ define <32 x bfloat> @fma_mask_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: 
fma_mask_load_213_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z) @@ -1117,7 +1117,7 @@ define <32 x bfloat> @fma_mask_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_mask_load_231_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x) @@ -1130,7 +1130,7 @@ define <32 x bfloat> @fma_mask_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_mask_load_321_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %y, <32 x bfloat> %x) @@ -1143,7 +1143,7 @@ define <32 x bfloat> @fma_mask_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_mask_load_132_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 {%k1} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y) @@ -1156,7 +1156,7 @@ define <32 x bfloat> @fma_mask_load_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_mask_load_312_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, 
%zmm0 {%k1} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y) @@ -1169,7 +1169,7 @@ define <32 x bfloat> @fma_maskz_load_123_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_maskz_load_123_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %y, <32 x bfloat> %z) @@ -1182,7 +1182,7 @@ define <32 x bfloat> @fma_maskz_load_213_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_maskz_load_213_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd213nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd213bf16 (%rdi), %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %x, <32 x bfloat> %z) @@ -1195,7 +1195,7 @@ define <32 x bfloat> @fma_maskz_load_231_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_maskz_load_231_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %y, <32 x bfloat> %z, <32 x bfloat> %x) @@ -1208,7 +1208,7 @@ define <32 x bfloat> @fma_maskz_load_321_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_maskz_load_321_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd231nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd231bf16 (%rdi), %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> 
%y, <32 x bfloat> %x) @@ -1221,7 +1221,7 @@ define <32 x bfloat> @fma_maskz_load_132_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_maskz_load_132_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %x, <32 x bfloat> %z, <32 x bfloat> %y) @@ -1234,7 +1234,7 @@ define <32 x bfloat> @fma_maskz_load_312_v32bf16(<32 x bfloat> %x, <32 x bfloat> ; CHECK-LABEL: fma_maskz_load_312_v32bf16: ; CHECK: # %bb.0: ; CHECK-NEXT: kmovd %esi, %k1 -; CHECK-NEXT: vfmadd132nepbf16 (%rdi), %zmm1, %zmm0 {%k1} {z} +; CHECK-NEXT: vfmadd132bf16 (%rdi), %zmm1, %zmm0 {%k1} {z} ; CHECK-NEXT: retq %z = load <32 x bfloat>, ptr %zp %a = call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %z, <32 x bfloat> %x, <32 x bfloat> %y) diff --git a/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll b/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll index 33c40ac6bb32c..1e2cf4956bd08 100644 --- a/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll +++ b/llvm/test/CodeGen/X86/avx10_2_512bf16-arith.ll @@ -2,26 +2,26 @@ ; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding -mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X64 ; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X86 -define <32 x bfloat> @test_int_x86_avx10_vaddnepbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_vaddnepbf16512: +define <32 x bfloat> @test_int_x86_avx10_vaddbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_vaddbf16512: ; CHECK: # %bb.0: -; CHECK-NEXT: vaddnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1] +; CHECK-NEXT: vaddbf16 %zmm1, %zmm0, %zmm0 # encoding: 
[0x62,0xf5,0x7d,0x48,0x58,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fadd <32 x bfloat> %x1, %x2 ret <32 x bfloat> %res } -define <32 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_add_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_mask_add_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_add_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2] +; X64-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_add_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_mask_add_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2] +; X86-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x58,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %res0 = fadd <32 x bfloat> %x1, %x2 @@ -29,22 +29,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_512(<32 x bfloat> %src ret <32 x bfloat> %res } -define <32 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_add_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_maskz_add_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_add_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # 
encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2] -; X64-NEXT: vaddnepbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x0e] -; X64-NEXT: vaddnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1] +; X64-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2] +; X64-NEXT: vaddbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x0e] +; X64-NEXT: vaddbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_add_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_maskz_add_bf16_512: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vaddnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2] -; X86-NEXT: vaddnepbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x08] -; X86-NEXT: vaddnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1] +; X86-NEXT: vaddbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0xc2] +; X86-NEXT: vaddbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x58,0x08] +; X86-NEXT: vaddbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x58,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %val = load <32 x bfloat>, ptr %ptr @@ -56,26 +56,26 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_512(<32 x bfloat> %sr ret <32 x bfloat> %res3 } -define <32 x bfloat> @test_int_x86_avx10_sub_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_sub_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_sub_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_sub_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vsubnepbf16 %zmm1, %zmm0, %zmm0 
# encoding: [0x62,0xf5,0x7d,0x48,0x5c,0xc1] +; CHECK-NEXT: vsubbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5c,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fsub <32 x bfloat> %x1, %x2 ret <32 x bfloat> %res } -define <32 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_sub_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_mask_sub_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_sub_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2] +; X64-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_sub_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_mask_sub_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2] +; X86-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5c,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %res0 = fsub <32 x bfloat> %x1, %x2 @@ -83,22 +83,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_512(<32 x bfloat> %src ret <32 x bfloat> %res } -define <32 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_maskz_sub_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_sub_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, 
%k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2] -; X64-NEXT: vsubnepbf16 (%rsi), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x0e] -; X64-NEXT: vsubnepbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1] +; X64-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2] +; X64-NEXT: vsubbf16 (%rsi), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x0e] +; X64-NEXT: vsubbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_maskz_sub_bf16_512: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsubnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2] -; X86-NEXT: vsubnepbf16 (%eax), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x08] -; X86-NEXT: vsubnepbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1] +; X86-NEXT: vsubbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5c,0xc2] +; X86-NEXT: vsubbf16 (%eax), %zmm1, %zmm1 # encoding: [0x62,0xf5,0x75,0x48,0x5c,0x08] +; X86-NEXT: vsubbf16 %zmm1, %zmm0, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x5c,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %val = load <32 x bfloat>, ptr %ptr @@ -110,28 +110,28 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_512(<32 x bfloat> %sr ret <32 x bfloat> %res3 } -declare <32 x bfloat> @llvm.x86.avx10.vmulnepbf16512(<32 x bfloat>, <32 x bfloat>) +declare <32 x bfloat> @llvm.x86.avx10.vmulbf16512(<32 x bfloat>, <32 x bfloat>) -define <32 x bfloat> @test_int_x86_avx10_mul_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: 
test_int_x86_avx10_mul_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_mul_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_mul_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vmulnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1] +; CHECK-NEXT: vmulbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fmul <32 x bfloat> %x1, %x2 ret <32 x bfloat> %res } -define <32 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_mul_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_mask_mul_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_mul_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2] +; X64-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_mul_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_mask_mul_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2] +; X86-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x59,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %res0 = fmul <32 x bfloat> %x1, %x2 @@ -139,22 +139,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_512(<32 x bfloat> %src ret <32 x bfloat> %res } -define <32 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: 
test_int_x86_avx10_maskz_mul_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_maskz_mul_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_mul_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2] -; X64-NEXT: vmulnepbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x0e] -; X64-NEXT: vmulnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1] +; X64-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2] +; X64-NEXT: vmulbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x0e] +; X64-NEXT: vmulbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_maskz_mul_bf16_512: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmulnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2] -; X86-NEXT: vmulnepbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x08] -; X86-NEXT: vmulnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1] +; X86-NEXT: vmulbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0xc2] +; X86-NEXT: vmulbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x59,0x08] +; X86-NEXT: vmulbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x59,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %val = load <32 x bfloat>, ptr %ptr @@ -166,26 +166,26 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_512(<32 x bfloat> %sr ret <32 x 
bfloat> %res3 } -define <32 x bfloat> @test_int_x86_avx10_div_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_div_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_div_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_div_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vdivnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1] +; CHECK-NEXT: vdivbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fdiv <32 x bfloat> %x1, %x2 ret <32 x bfloat> %res } -define <32 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_div_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_mask_div_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_div_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2] +; X64-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_div_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_mask_div_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2] +; X86-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x49,0x5e,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %res0 = fdiv <32 x bfloat> %x1, %x2 @@ -193,22 +193,22 @@ define <32 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_512(<32 x bfloat> %src ret <32 x bfloat> %res } -define <32 x bfloat> 
@test_int_x86_avx10_maskz_div_nepbf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_div_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_maskz_div_bf16_512(<32 x bfloat> %src, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_div_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2] -; X64-NEXT: vdivnepbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x0e] -; X64-NEXT: vdivnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1] +; X64-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2] +; X64-NEXT: vdivbf16 (%rsi), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x0e] +; X64-NEXT: vdivbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_div_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_maskz_div_bf16_512: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vdivnepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2] -; X86-NEXT: vdivnepbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x08] -; X86-NEXT: vdivnepbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1] +; X86-NEXT: vdivbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0xc2] +; X86-NEXT: vdivbf16 (%eax), %zmm1, %zmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xc9,0x5e,0x08] +; X86-NEXT: vdivbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5e,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> %val = load <32 
x bfloat>, ptr %ptr @@ -220,10 +220,10 @@ define <32 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_512(<32 x bfloat> %sr ret <32 x bfloat> %res3 } -define i32 @test_int_x86_avx10_vcmppbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_vcmppbf16512: +define i32 @test_int_x86_avx10_vcmpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_vcmpbf16512: ; CHECK: # %bb.0: -; CHECK-NEXT: vcmpunordpbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x03] +; CHECK-NEXT: vcmpunordbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x03] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] @@ -233,10 +233,10 @@ define i32 @test_int_x86_avx10_vcmppbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2 } ; FIXME: _mm512_mask_cmp_p[s|h]_mask is not using {k2} but gcc does -define i32 @test_int_x86_avx10_vcmppbf16512_mask2(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_vcmppbf16512_mask2: +define i32 @test_int_x86_avx10_vcmpbf16512_mask2(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_vcmpbf16512_mask2: ; CHECK: # %bb.0: -; CHECK-NEXT: vcmpeqpbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x00] +; CHECK-NEXT: vcmpeqbf16 %zmm1, %zmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x48,0xc2,0xc1,0x00] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: andl $3, %eax # encoding: [0x83,0xe0,0x03] ; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77] @@ -247,10 +247,10 @@ define i32 @test_int_x86_avx10_vcmppbf16512_mask2(<32 x bfloat> %x1, <32 x bfloa ret i32 %3 } -define <32 x bfloat> @test_sqrt_nepbf16_512(<32 x bfloat> %a0) { -; CHECK-LABEL: test_sqrt_nepbf16_512: +define <32 x bfloat> @test_sqrt_bf16_512(<32 x bfloat> %a0) { +; CHECK-LABEL: test_sqrt_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vsqrtnepbf16 
%zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x51,0xc0] +; CHECK-NEXT: vsqrtbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x51,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %1 = tail call <32 x bfloat> @llvm.sqrt.v32bf16(<32 x bfloat> %a0) ret <32 x bfloat> %1 @@ -260,13 +260,13 @@ define <32 x bfloat> @test_mm512_mask_sqrt_pbh(<32 x bfloat> %__W, i32 %__U, <32 ; X64-LABEL: test_mm512_mask_sqrt_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsqrtnepbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1] +; X64-NEXT: vsqrtbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask_sqrt_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsqrtnepbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1] +; X86-NEXT: vsqrtbf16 %zmm1, %zmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x49,0x51,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <32 x bfloat> @llvm.sqrt.v32bf16(<32 x bfloat> %__A) @@ -279,13 +279,13 @@ define <32 x bfloat> @test_mm512_maskz_sqrt_pbh(i32 %__U, <32 x bfloat>%__A) { ; X64-LABEL: test_mm512_maskz_sqrt_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsqrtnepbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0] +; X64-NEXT: vsqrtbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_maskz_sqrt_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsqrtnepbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0] +; X86-NEXT: vsqrtbf16 %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x51,0xc0] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call 
<32 x bfloat> @llvm.sqrt.v32bf16(<32 x bfloat> %__A) @@ -297,7 +297,7 @@ entry: define <32 x bfloat> @test_mm512_fmaddne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) { ; CHECK-LABEL: test_mm512_fmaddne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xa8,0xc2] +; CHECK-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xa8,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %0 = tail call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) @@ -308,13 +308,13 @@ define <32 x bfloat> @test_mm512_mask_fmaddne_pbh(<32 x bfloat> %__A, i32 %__U, ; X64-LABEL: test_mm512_mask_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1] +; X64-NEXT: vfmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1] +; X86-NEXT: vfmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x98,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) @@ -327,14 +327,14 @@ define <32 x bfloat> @test_mm512_mask3_fmaddne_pbh(<32 x bfloat> %__A, <32 x bfl ; X64-LABEL: test_mm512_mask3_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xb8,0xd1] +; X64-NEXT: vfmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: 
[0x62,0xf6,0x7c,0x49,0xb8,0xd1] ; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask3_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xb8,0xd1] +; X86-NEXT: vfmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xb8,0xd1] ; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -348,13 +348,13 @@ define <32 x bfloat> @test_mm512_maskz_fmaddne_pbh(i32 %__U, <32 x bfloat> %__A, ; X64-LABEL: test_mm512_maskz_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2] +; X64-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_maskz_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2] +; X86-NEXT: vfmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xa8,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <32 x bfloat> @llvm.fma.v32bf16(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) @@ -366,7 +366,7 @@ entry: define <32 x bfloat> @test_mm512_fmsubne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) { ; CHECK-LABEL: test_mm512_fmsubne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfmsub213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xaa,0xc2] +; CHECK-NEXT: vfmsub213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xaa,0xc2] ; 
CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <32 x bfloat> %__C @@ -378,13 +378,13 @@ define <32 x bfloat> @test_mm512_mask_fmsubne_pbh(<32 x bfloat> %__A, i32 %__U, ; X64-LABEL: test_mm512_mask_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1] +; X64-NEXT: vfmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1] +; X86-NEXT: vfmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9a,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <32 x bfloat> %__C @@ -398,14 +398,14 @@ define <32 x bfloat> @test_mm512_mask3_fmsubne_pbh(<32 x bfloat> %__A, <32 x bfl ; X64-LABEL: test_mm512_mask3_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1] +; X64-NEXT: vfmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1] ; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask3_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1] +; X86-NEXT: vfmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xba,0xd1] ; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] 
entry: @@ -420,13 +420,13 @@ define <32 x bfloat> @test_mm512_maskz_fmsubne_pbh(i32 %__U, <32 x bfloat> %__A, ; X64-LABEL: test_mm512_maskz_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2] +; X64-NEXT: vfmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_maskz_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2] +; X86-NEXT: vfmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xaa,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <32 x bfloat> %__C @@ -439,7 +439,7 @@ entry: define <32 x bfloat> @test_mm512_fnmaddne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) { ; CHECK-LABEL: test_mm512_fnmaddne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfnmadd213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xac,0xc2] +; CHECK-NEXT: vfnmadd213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xac,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <32 x bfloat> %__B @@ -451,13 +451,13 @@ define <32 x bfloat> @test_mm512_mask_fnmaddne_pbh(<32 x bfloat> %__A, i32 %__U, ; X64-LABEL: test_mm512_mask_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1] +; X64-NEXT: vfnmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: 
[0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1] +; X86-NEXT: vfnmadd132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9c,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <32 x bfloat> %__B @@ -471,14 +471,14 @@ define <32 x bfloat> @test_mm512_mask3_fnmaddne_pbh(<32 x bfloat> %__A, <32 x bf ; X64-LABEL: test_mm512_mask3_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1] +; X64-NEXT: vfnmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1] ; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask3_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1] +; X86-NEXT: vfnmadd231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbc,0xd1] ; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -493,13 +493,13 @@ define <32 x bfloat> @test_mm512_maskz_fnmaddne_pbh(i32 %__U, <32 x bfloat> %__A ; X64-LABEL: test_mm512_maskz_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2] +; X64-NEXT: vfnmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_maskz_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: 
vfnmadd213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2] +; X86-NEXT: vfnmadd213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xac,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <32 x bfloat> %__B @@ -512,7 +512,7 @@ entry: define <32 x bfloat> @test_mm512_fnmsubne_pbh(<32 x bfloat> %__A, <32 x bfloat> %__B, <32 x bfloat> %__C) { ; CHECK-LABEL: test_mm512_fnmsubne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfnmsub213nepbf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xae,0xc2] +; CHECK-NEXT: vfnmsub213bf16 %zmm2, %zmm1, %zmm0 # encoding: [0x62,0xf6,0x74,0x48,0xae,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <32 x bfloat> %__B @@ -525,13 +525,13 @@ define <32 x bfloat> @test_mm512_mask_fnmsubne_pbh(<32 x bfloat> %__A, i32 %__U, ; X64-LABEL: test_mm512_mask_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1] +; X64-NEXT: vfnmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub132nepbf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1] +; X86-NEXT: vfnmsub132bf16 %zmm1, %zmm2, %zmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x49,0x9e,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <32 x bfloat> %__B @@ -546,14 +546,14 @@ define <32 x bfloat> @test_mm512_mask3_fnmsubne_pbh(<32 x bfloat> %__A, <32 x bf ; X64-LABEL: test_mm512_mask3_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1] +; 
X64-NEXT: vfnmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1] ; X64-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_mask3_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub231nepbf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1] +; X86-NEXT: vfnmsub231bf16 %zmm1, %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0xbe,0xd1] ; X86-NEXT: vmovaps %zmm2, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -569,13 +569,13 @@ define <32 x bfloat> @test_mm512_maskz_fnmsubne_pbh(i32 %__U, <32 x bfloat> %__A ; X64-LABEL: test_mm512_maskz_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2] +; X64-NEXT: vfnmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm512_maskz_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub213nepbf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2] +; X86-NEXT: vfnmsub213bf16 %zmm2, %zmm1, %zmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xc9,0xae,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <32 x bfloat> %__B diff --git a/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll b/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll index 5f2bcf0556b02..da17b995afedf 100644 --- a/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll +++ b/llvm/test/CodeGen/X86/avx10_2_512bf16-intrinsics.ll @@ -2,231 +2,231 @@ ; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding 
-mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X64 ; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-512 | FileCheck %s --check-prefixes=CHECK,X86 -declare <32 x bfloat> @llvm.x86.avx10.vminpbf16512(<32 x bfloat>, <32 x bfloat>) +declare <32 x bfloat> @llvm.x86.avx10.vminbf16512(<32 x bfloat>, <32 x bfloat>) -define <32 x bfloat> @test_int_x86_avx10_min_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_min_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_min_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_min_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vminpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5d,0xc1] +; CHECK-NEXT: vminbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5d,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res0 = call <32 x bfloat> @llvm.x86.avx10.vminpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) + %res0 = call <32 x bfloat> @llvm.x86.avx10.vminbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) ret <32 x bfloat> %res0 } -define <32 x bfloat> @test_int_x86_avx10_maskz_min_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) { -; X64-LABEL: test_int_x86_avx10_maskz_min_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_maskz_min_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) { +; X64-LABEL: test_int_x86_avx10_maskz_min_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vminpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1] +; X64-NEXT: vminbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_min_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_maskz_min_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: 
vminpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1] +; X86-NEXT: vminbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5d,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> - %res0 = call <32 x bfloat> @llvm.x86.avx10.vminpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) + %res0 = call <32 x bfloat> @llvm.x86.avx10.vminbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) %res1 = select <32 x i1> %mask, <32 x bfloat> %res0, <32 x bfloat> zeroinitializer ret <32 x bfloat> %res1 } -declare <32 x bfloat> @llvm.x86.avx10.vmaxpbf16512(<32 x bfloat>, <32 x bfloat>) +declare <32 x bfloat> @llvm.x86.avx10.vmaxbf16512(<32 x bfloat>, <32 x bfloat>) -define <32 x bfloat> @test_int_x86_avx10_max_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_max_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_max_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_max_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vmaxpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5f,0xc1] +; CHECK-NEXT: vmaxbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x5f,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) + %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) ret <32 x bfloat> %res0 } -define <32 x bfloat> @test_int_x86_avx10_maskz_max_nepbf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) { -; X64-LABEL: test_int_x86_avx10_maskz_max_nepbf16_512: +define <32 x bfloat> @test_int_x86_avx10_maskz_max_bf16_512(<32 x bfloat> %x1, <32 x bfloat> %x2, i32 %msk) { +; X64-LABEL: test_int_x86_avx10_maskz_max_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmaxpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1] +; X64-NEXT: vmaxbf16 
%zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_max_nepbf16_512: +; X86-LABEL: test_int_x86_avx10_maskz_max_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmaxpbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1] +; X86-NEXT: vmaxbf16 %zmm1, %zmm0, %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xc9,0x5f,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %msk to <32 x i1> - %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxpbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) + %res0 = call <32 x bfloat> @llvm.x86.avx10.vmaxbf16512(<32 x bfloat> %x1, <32 x bfloat> %x2) %res1 = select <32 x i1> %mask, <32 x bfloat> %res0, <32 x bfloat> zeroinitializer ret <32 x bfloat> %res1 } -declare <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.512(<32 x bfloat>, <32 x bfloat>, i32) +declare <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.512(<32 x bfloat>, <32 x bfloat>, i32) -define <32 x bfloat> @test_rsqrt_nepbf16_512(<32 x bfloat> %a0) { -; CHECK-LABEL: test_rsqrt_nepbf16_512: +define <32 x bfloat> @test_rsqrt_bf16_512(<32 x bfloat> %a0) { +; CHECK-LABEL: test_rsqrt_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vrsqrtpbf16 %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xc0] +; CHECK-NEXT: vrsqrtbf16 %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.512(<32 x bfloat> %a0, <32 x bfloat> zeroinitializer, i32 -1) + %res = call <32 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.512(<32 x bfloat> %a0, <32 x bfloat> zeroinitializer, i32 -1) ret <32 x bfloat> %res } -declare <32 x i1> @llvm.x86.avx10.fpclass.nepbf16.512(<32 x bfloat>, i32) +declare <32 x i1> @llvm.x86.avx10.fpclass.bf16.512(<32 x bfloat>, i32) -define i32 @test_int_x86_avx512_fpclass_nepbf16_512(<32 
x bfloat> %x0) { -; CHECK-LABEL: test_int_x86_avx512_fpclass_nepbf16_512: +define i32 @test_int_x86_avx512_fpclass_bf16_512(<32 x bfloat> %x0) { +; CHECK-LABEL: test_int_x86_avx512_fpclass_bf16_512: ; CHECK: # %bb.0: -; CHECK-NEXT: vfpclasspbf16 $6, %zmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x48,0x66,0xc8,0x06] +; CHECK-NEXT: vfpclassbf16 $6, %zmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x48,0x66,0xc8,0x06] ; CHECK-NEXT: # k1 = isPositiveZero(zmm0) | isNegativeZero(zmm0) -; CHECK-NEXT: vfpclasspbf16 $0, %zmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x66,0xc0,0x00] +; CHECK-NEXT: vfpclassbf16 $0, %zmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x66,0xc0,0x00] ; CHECK-NEXT: # k0 {%k1} = false ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <32 x i1> @llvm.x86.avx10.fpclass.nepbf16.512(<32 x bfloat> %x0, i32 0) - %res1 = call <32 x i1> @llvm.x86.avx10.fpclass.nepbf16.512(<32 x bfloat> %x0, i32 6) + %res = call <32 x i1> @llvm.x86.avx10.fpclass.bf16.512(<32 x bfloat> %x0, i32 0) + %res1 = call <32 x i1> @llvm.x86.avx10.fpclass.bf16.512(<32 x bfloat> %x0, i32 6) %1 = and <32 x i1> %res1, %res %2 = bitcast <32 x i1> %1 to i32 ret i32 %2 } -declare <32 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.512(<32 x bfloat>, <32 x bfloat>, i32) +declare <32 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.512(<32 x bfloat>, <32 x bfloat>, i32) -define <32 x bfloat> @test_rcp_nepbf16_512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask) { -; X64-LABEL: test_rcp_nepbf16_512: +define <32 x bfloat> @test_rcp_bf16_512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask) { +; X64-LABEL: test_rcp_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vrcppbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8] +; X64-NEXT: vrcpbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8] ; X64-NEXT: vmovaps %zmm1, 
%zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_rcp_nepbf16_512: +; X86-LABEL: test_rcp_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vrcppbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8] +; X86-NEXT: vrcpbf16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x49,0x4c,0xc8] ; X86-NEXT: vmovaps %zmm1, %zmm0 # encoding: [0x62,0xf1,0x7c,0x48,0x28,0xc1] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <32 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask) + %res = call <32 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.512(<32 x bfloat> %a0, <32 x bfloat> %a1, i32 %mask) ret <32 x bfloat> %res } -declare <32 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32) +declare <32 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32) -define <32 x bfloat>@test_int_x86_avx512_mask_reduce_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_512: +define <32 x bfloat>@test_int_x86_avx512_mask_reduce_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_reduce_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vreducenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08] -; X64-NEXT: vreducenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X64-NEXT: vreducebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08] +; X64-NEXT: vreducebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04] +; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X64-NEXT: retq # 
encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_512: +; X86-LABEL: test_int_x86_avx512_mask_reduce_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vreducenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08] -; X86-NEXT: vreducenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X86-NEXT: vreducebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x56,0xc8,0x08] +; X86-NEXT: vreducebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x56,0xc0,0x04] +; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3) - %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1) + %res = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3) + %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1) %res2 = fadd <32 x bfloat> %res, %res1 ret <32 x bfloat> %res2 } -declare <32 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32) +declare <32 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32) -define <32 x bfloat>@test_int_x86_avx512_mask_rndscale_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_512: +define <32 x bfloat>@test_int_x86_avx512_mask_rndscale_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_rndscale_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: 
[0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vrndscalenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08] -; X64-NEXT: vrndscalenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X64-NEXT: vrndscalebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08] +; X64-NEXT: vrndscalebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04] +; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_512: +; X86-LABEL: test_int_x86_avx512_mask_rndscale_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vrndscalenepbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08] -; X86-NEXT: vrndscalenepbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X86-NEXT: vrndscalebf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x08,0xc8,0x08] +; X86-NEXT: vrndscalebf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x08,0xc0,0x04] +; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3) - %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1) + %res = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3) + %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1) %res2 = fadd <32 x bfloat> %res, %res1 ret <32 x bfloat> 
%res2 } -declare <32 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.512(<32 x bfloat>, <32 x bfloat>, i32) +declare <32 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.512(<32 x bfloat>, <32 x bfloat>, i32) -define <32 x bfloat>@test_int_x86_avx512_mask_getexp_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2) { -; X64-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_512: +define <32 x bfloat>@test_int_x86_avx512_mask_getexp_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2) { +; X64-LABEL: test_int_x86_avx512_mask_getexp_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetexppbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0] +; X64-NEXT: vgetexpbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0] ; X64-NEXT: vmovdqu16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xc8] -; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_512: +; X86-LABEL: test_int_x86_avx512_mask_getexp_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetexppbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0] +; X86-NEXT: vgetexpbf16 %zmm0, %zmm0 # encoding: [0x62,0xf5,0x7d,0x48,0x42,0xc0] ; X86-NEXT: vmovdqu16 %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xc8] -; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2) - %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> zeroinitializer, 
i32 -1) + %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, i32 %x2) + %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.512(<32 x bfloat> %x0, <32 x bfloat> zeroinitializer, i32 -1) %res3 = fadd <32 x bfloat> %res1, %res2 ret <32 x bfloat> %res3 } -declare <32 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32) +declare <32 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.512(<32 x bfloat>, i32, <32 x bfloat>, i32) -define <32 x bfloat>@test_int_x86_avx512_mask_getmant_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_512: +define <32 x bfloat>@test_int_x86_avx512_mask_getmant_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x2, i32 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_getmant_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetmantpbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08] -; X64-NEXT: vgetmantpbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X64-NEXT: vgetmantbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08] +; X64-NEXT: vgetmantbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04] +; X64-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_512: +; X86-LABEL: test_int_x86_avx512_mask_getmant_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetmantpbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08] -; X86-NEXT: vgetmantpbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %zmm0, %zmm1, %zmm0 # 
encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] +; X86-NEXT: vgetmantbf16 $8, %zmm0, %zmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x49,0x26,0xc8,0x08] +; X86-NEXT: vgetmantbf16 $4, %zmm0, %zmm0 # encoding: [0x62,0xf3,0x7f,0x48,0x26,0xc0,0x04] +; X86-NEXT: vaddbf16 %zmm0, %zmm1, %zmm0 # encoding: [0x62,0xf5,0x75,0x48,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3) - %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1) + %res = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.512(<32 x bfloat> %x0, i32 8, <32 x bfloat> %x2, i32 %x3) + %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.512(<32 x bfloat> %x0, i32 4, <32 x bfloat> %x2, i32 -1) %res2 = fadd <32 x bfloat> %res, %res1 ret <32 x bfloat> %res2 } -declare <32 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.512(<32 x bfloat>, <32 x bfloat>, <32 x bfloat>, i32) +declare <32 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.512(<32 x bfloat>, <32 x bfloat>, <32 x bfloat>, i32) -define <32 x bfloat>@test_int_x86_avx512_mask_scalef_nepbf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_512: +define <32 x bfloat>@test_int_x86_avx512_mask_scalef_bf16_512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_scalef_bf16_512: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vscalefpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1] +; X64-NEXT: vscalefbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1] ; X64-NEXT: vmovdqu16 %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xd0] -; X64-NEXT: vaddnepbf16 %zmm0, %zmm2, %zmm0 # encoding: [0x62,0xf5,0x6d,0x48,0x58,0xc0] +; X64-NEXT: vaddbf16 %zmm0, %zmm2, %zmm0 # encoding: 
[0x62,0xf5,0x6d,0x48,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_512: +; X86-LABEL: test_int_x86_avx512_mask_scalef_bf16_512: ; X86: # %bb.0: ; X86-NEXT: kmovd {{[0-9]+}}(%esp), %k1 # encoding: [0xc4,0xe1,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vscalefpbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1] +; X86-NEXT: vscalefbf16 %zmm1, %zmm0, %zmm0 # encoding: [0x62,0xf6,0x7c,0x48,0x2c,0xc1] ; X86-NEXT: vmovdqu16 %zmm0, %zmm2 {%k1} # encoding: [0x62,0xf1,0xff,0x49,0x6f,0xd0] -; X86-NEXT: vaddnepbf16 %zmm0, %zmm2, %zmm0 # encoding: [0x62,0xf5,0x6d,0x48,0x58,0xc0] +; X86-NEXT: vaddbf16 %zmm0, %zmm2, %zmm0 # encoding: [0x62,0xf5,0x6d,0x48,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i32 %x3 to <32 x i1> - %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3) - %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> zeroinitializer, i32 -1) + %res1 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> %x2, i32 %x3) + %res2 = call <32 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.512(<32 x bfloat> %x0, <32 x bfloat> %x1, <32 x bfloat> zeroinitializer, i32 -1) %res3 = fadd <32 x bfloat> %res1, %res2 ret <32 x bfloat> %res3 } diff --git a/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll b/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll index c97d27ff324bb..42831a453cb1d 100644 --- a/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll +++ b/llvm/test/CodeGen/X86/avx10_2bf16-arith.ll @@ -2,48 +2,48 @@ ; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X64 ; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X86 -define <16 x 
bfloat> @test_int_x86_avx10_add_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_add_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_add_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_add_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vaddnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1] +; CHECK-NEXT: vaddbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fadd <16 x bfloat> %x1, %x2 ret <16 x bfloat> %res } -define <16 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_add_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_mask_add_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_add_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2] +; X64-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_add_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_mask_add_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2] +; X86-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x58,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> %res0 = fadd <16 x bfloat> %x1, %x2 %res = select <16 x i1> %mask, <16 x bfloat> %res0, <16 x bfloat> %src ret <16 x bfloat> %res } -define <16 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, 
i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_add_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_maskz_add_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_add_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2] -; X64-NEXT: vaddnepbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x0e] -; X64-NEXT: vaddnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1] +; X64-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2] +; X64-NEXT: vaddbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x0e] +; X64-NEXT: vaddbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_add_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_maskz_add_bf16_256: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vaddnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2] -; X86-NEXT: vaddnepbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x08] -; X86-NEXT: vaddnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1] +; X86-NEXT: vaddbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0xc2] +; X86-NEXT: vaddbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x58,0x08] +; X86-NEXT: vaddbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> %val = load <16 x bfloat>, ptr %ptr @@ -55,26 +55,26 @@ define <16 x bfloat> 
@test_int_x86_avx10_maskz_add_nepbf16_256(<16 x bfloat> %sr ret <16 x bfloat> %res3 } -define <8 x bfloat> @test_int_x86_avx10_add_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_add_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_add_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_add_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vaddnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1] +; CHECK-NEXT: vaddbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fadd <8 x bfloat> %x1, %x2 ret <8 x bfloat> %res } -define <8 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_add_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_mask_add_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_add_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2] +; X64-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_add_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_mask_add_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2] +; X86-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x58,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %res0 = fadd <8 x bfloat> %x1, %x2 @@ -82,22 +82,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_add_nepbf16_128(<8 x bfloat> %src, ret <8 x bfloat> %res } -define <8 x 
bfloat> @test_int_x86_avx10_maskz_add_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_add_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_maskz_add_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_add_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2] -; X64-NEXT: vaddnepbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x0e] -; X64-NEXT: vaddnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1] +; X64-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2] +; X64-NEXT: vaddbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x0e] +; X64-NEXT: vaddbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_add_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_maskz_add_bf16_128: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vaddnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2] -; X86-NEXT: vaddnepbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x08] -; X86-NEXT: vaddnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1] +; X86-NEXT: vaddbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0xc2] +; X86-NEXT: vaddbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x58,0x08] +; X86-NEXT: vaddbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x58,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %val = load <8 x 
bfloat>, ptr %ptr @@ -109,26 +109,26 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_add_nepbf16_128(<8 x bfloat> %src, ret <8 x bfloat> %res3 } -define <16 x bfloat> @test_int_x86_avx10_sub_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_sub_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_sub_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_sub_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vsubnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5c,0xc1] +; CHECK-NEXT: vsubbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5c,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fsub <16 x bfloat> %x1, %x2 ret <16 x bfloat> %res } -define <16 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_sub_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_mask_sub_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_sub_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2] +; X64-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_sub_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_mask_sub_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2] +; X86-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5c,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> %res0 = fsub <16 x bfloat> %x1, %x2 @@ -136,22 +136,22 @@ define <16 x bfloat> 
@test_int_x86_avx10_mask_sub_nepbf16_256(<16 x bfloat> %src ret <16 x bfloat> %res } -define <16 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_maskz_sub_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_sub_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2] -; X64-NEXT: vsubnepbf16 (%rsi), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x0e] -; X64-NEXT: vsubnepbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1] +; X64-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2] +; X64-NEXT: vsubbf16 (%rsi), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x0e] +; X64-NEXT: vsubbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_maskz_sub_bf16_256: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsubnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2] -; X86-NEXT: vsubnepbf16 (%eax), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x08] -; X86-NEXT: vsubnepbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1] +; X86-NEXT: vsubbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5c,0xc2] +; X86-NEXT: vsubbf16 (%eax), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x5c,0x08] +; X86-NEXT: vsubbf16 %ymm1, %ymm0, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x5c,0xc1] ; 
X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> %val = load <16 x bfloat>, ptr %ptr @@ -163,26 +163,26 @@ define <16 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_256(<16 x bfloat> %sr ret <16 x bfloat> %res3 } -define <8 x bfloat> @test_int_x86_avx10_sub_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_sub_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_sub_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_sub_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vsubnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5c,0xc1] +; CHECK-NEXT: vsubbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5c,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fsub <8 x bfloat> %x1, %x2 ret <8 x bfloat> %res } -define <8 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_sub_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_mask_sub_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_sub_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2] +; X64-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_sub_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_mask_sub_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2] +; X86-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5c,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %res0 = fsub <8 x 
bfloat> %x1, %x2 @@ -190,22 +190,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_sub_nepbf16_128(<8 x bfloat> %src, ret <8 x bfloat> %res } -define <8 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_maskz_sub_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_sub_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2] -; X64-NEXT: vsubnepbf16 (%rsi), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x0e] -; X64-NEXT: vsubnepbf16 %xmm1, %xmm0, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1] +; X64-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2] +; X64-NEXT: vsubbf16 (%rsi), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x0e] +; X64-NEXT: vsubbf16 %xmm1, %xmm0, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_sub_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_maskz_sub_bf16_128: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsubnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2] -; X86-NEXT: vsubnepbf16 (%eax), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x08] -; X86-NEXT: vsubnepbf16 %xmm1, %xmm0, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1] +; X86-NEXT: vsubbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5c,0xc2] +; X86-NEXT: vsubbf16 (%eax), %xmm1, %xmm1 # encoding: [0x62,0xf5,0x75,0x08,0x5c,0x08] +; X86-NEXT: vsubbf16 %xmm1, %xmm0, %xmm0 {%k1} 
# encoding: [0x62,0xf5,0x7d,0x09,0x5c,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %val = load <8 x bfloat>, ptr %ptr @@ -217,26 +217,26 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_sub_nepbf16_128(<8 x bfloat> %src, ret <8 x bfloat> %res3 } -define <16 x bfloat> @test_int_x86_avx10_mul_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_mul_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_mul_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_mul_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vmulnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1] +; CHECK-NEXT: vmulbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fmul <16 x bfloat> %x1, %x2 ret <16 x bfloat> %res } -define <16 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_mul_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_mask_mul_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_mul_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2] +; X64-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_mul_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_mask_mul_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2] +; X86-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x59,0xc2] ; X86-NEXT: retl # encoding: [0xc3] 
%mask = bitcast i16 %msk to <16 x i1> %res0 = fmul <16 x bfloat> %x1, %x2 @@ -244,22 +244,22 @@ define <16 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_256(<16 x bfloat> %src ret <16 x bfloat> %res } -define <16 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_maskz_mul_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_mul_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2] -; X64-NEXT: vmulnepbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0x0e] -; X64-NEXT: vmulnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1] +; X64-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2] +; X64-NEXT: vmulbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0x0e] +; X64-NEXT: vmulbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_maskz_mul_bf16_256: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmulnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2] -; X86-NEXT: vmulnepbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0x08] -; X86-NEXT: vmulnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1] +; X86-NEXT: vmulbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x59,0xc2] +; X86-NEXT: vmulbf16 (%eax), %ymm1, %ymm1 {%k1} {z} 
# encoding: [0x62,0xf5,0x75,0xa9,0x59,0x08] +; X86-NEXT: vmulbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x59,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> %val = load <16 x bfloat>, ptr %ptr @@ -271,26 +271,26 @@ define <16 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_256(<16 x bfloat> %sr ret <16 x bfloat> %res3 } -define <8 x bfloat> @test_int_x86_avx10_mul_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_mul_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_mul_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_mul_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vmulnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1] +; CHECK-NEXT: vmulbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fmul <8 x bfloat> %x1, %x2 ret <8 x bfloat> %res } -define <8 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_mul_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_mask_mul_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_mul_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2] +; X64-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_mul_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_mask_mul_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2] +; X86-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} # 
encoding: [0x62,0xf5,0x75,0x09,0x59,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %res0 = fmul <8 x bfloat> %x1, %x2 @@ -298,22 +298,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_mul_nepbf16_128(<8 x bfloat> %src, ret <8 x bfloat> %res } -define <8 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_maskz_mul_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_mul_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0xc2] -; X64-NEXT: vmulnepbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x0e] -; X64-NEXT: vmulnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1] +; X64-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0xc2] +; X64-NEXT: vmulbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x0e] +; X64-NEXT: vmulbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_mul_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_maskz_mul_bf16_128: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmulnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0xc2] -; X86-NEXT: vmulnepbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x08] -; X86-NEXT: vmulnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1] +; X86-NEXT: vmulbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: 
[0x62,0xf5,0x75,0x89,0x59,0xc2] +; X86-NEXT: vmulbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x59,0x08] +; X86-NEXT: vmulbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x59,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %val = load <8 x bfloat>, ptr %ptr @@ -325,26 +325,26 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_mul_nepbf16_128(<8 x bfloat> %src, ret <8 x bfloat> %res3 } -define <16 x bfloat> @test_int_x86_avx10_div_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_div_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_div_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_div_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vdivnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1] +; CHECK-NEXT: vdivbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fdiv <16 x bfloat> %x1, %x2 ret <16 x bfloat> %res } -define <16 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_div_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_mask_div_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_div_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2] +; X64-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_div_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_mask_div_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} # 
encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2] +; X86-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x75,0x29,0x5e,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> %res0 = fdiv <16 x bfloat> %x1, %x2 @@ -353,22 +353,22 @@ define <16 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_256(<16 x bfloat> %src } ; FIXME: assembly order is different from fp16 ones -define <16 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_div_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_maskz_div_bf16_256(<16 x bfloat> %src, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_div_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2] -; X64-NEXT: vdivnepbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x0e] -; X64-NEXT: vdivnepbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1] +; X64-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2] +; X64-NEXT: vdivbf16 (%rsi), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x0e] +; X64-NEXT: vdivbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_div_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_maskz_div_bf16_256: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vdivnepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2] -; X86-NEXT: vdivnepbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x08] -; X86-NEXT: vdivnepbf16 %ymm1, %ymm0, 
%ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1] +; X86-NEXT: vdivbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0xc2] +; X86-NEXT: vdivbf16 (%eax), %ymm1, %ymm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0xa9,0x5e,0x08] +; X86-NEXT: vdivbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5e,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> %val = load <16 x bfloat>, ptr %ptr @@ -380,26 +380,26 @@ define <16 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_256(<16 x bfloat> %sr ret <16 x bfloat> %res3 } -define <8 x bfloat> @test_int_x86_avx10_div_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_div_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_div_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_div_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vdivnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1] +; CHECK-NEXT: vdivbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %res = fdiv <8 x bfloat> %x1, %x2 ret <8 x bfloat> %res } -define <8 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_mask_div_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_mask_div_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_mask_div_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2] +; X64-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_mask_div_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_mask_div_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), 
%k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2] +; X86-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x75,0x09,0x5e,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %res0 = fdiv <8 x bfloat> %x1, %x2 @@ -408,22 +408,22 @@ define <8 x bfloat> @test_int_x86_avx10_mask_div_nepbf16_128(<8 x bfloat> %src, } ; FIXME: assembly order is different from fp16 ones -define <8 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { -; X64-LABEL: test_int_x86_avx10_maskz_div_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_maskz_div_bf16_128(<8 x bfloat> %src, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk, ptr %ptr) { +; X64-LABEL: test_int_x86_avx10_maskz_div_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2] -; X64-NEXT: vdivnepbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x0e] -; X64-NEXT: vdivnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1] +; X64-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2] +; X64-NEXT: vdivbf16 (%rsi), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x0e] +; X64-NEXT: vdivbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_div_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_maskz_div_bf16_128: ; X86: # %bb.0: ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax # encoding: [0x8b,0x44,0x24,0x08] ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vdivnepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2] -; X86-NEXT: vdivnepbf16 (%eax), %xmm1, %xmm1 {%k1} 
{z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x08] -; X86-NEXT: vdivnepbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1] +; X86-NEXT: vdivbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0xc2] +; X86-NEXT: vdivbf16 (%eax), %xmm1, %xmm1 {%k1} {z} # encoding: [0x62,0xf5,0x75,0x89,0x5e,0x08] +; X86-NEXT: vdivbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5e,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> %val = load <8 x bfloat>, ptr %ptr @@ -435,10 +435,10 @@ define <8 x bfloat> @test_int_x86_avx10_maskz_div_nepbf16_128(<8 x bfloat> %src, ret <8 x bfloat> %res3 } -define i16 @test_int_x86_avx10_vcmppbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_vcmppbf16256: +define i16 @test_int_x86_avx10_vcmpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_vcmpbf16256: ; CHECK: # %bb.0: -; CHECK-NEXT: vcmpunordpbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x03] +; CHECK-NEXT: vcmpunordbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x03] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: # kill: def $ax killed $ax killed $eax ; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77] @@ -448,10 +448,10 @@ define i16 @test_int_x86_avx10_vcmppbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2 ret i16 %res } -define i16 @test_int_x86_avx10_vcmppbf16256_mask2(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_vcmppbf16256_mask2: +define i16 @test_int_x86_avx10_vcmpbf16256_mask2(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_vcmpbf16256_mask2: ; CHECK: # %bb.0: -; CHECK-NEXT: vcmpeqpbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x00] +; CHECK-NEXT: vcmpeqbf16 %ymm1, %ymm0, %k0 # encoding: [0x62,0xf3,0x7f,0x28,0xc2,0xc1,0x00] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: andl $3, 
%eax # encoding: [0x83,0xe0,0x03] ; CHECK-NEXT: # kill: def $ax killed $ax killed $eax @@ -463,10 +463,10 @@ define i16 @test_int_x86_avx10_vcmppbf16256_mask2(<16 x bfloat> %x1, <16 x bfloa ret i16 %3 } -define i8 @test_int_x86_avx10_vcmppbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_vcmppbf16128: +define i8 @test_int_x86_avx10_vcmpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_vcmpbf16128: ; CHECK: # %bb.0: -; CHECK-NEXT: vcmpunordpbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x03] +; CHECK-NEXT: vcmpunordbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x03] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: # kill: def $al killed $al killed $eax ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] @@ -475,10 +475,10 @@ define i8 @test_int_x86_avx10_vcmppbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) { ret i8 %res } -define i8 @test_int_x86_avx10_vcmppbf16128_mask2(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_vcmppbf16128_mask2: +define i8 @test_int_x86_avx10_vcmpbf16128_mask2(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_vcmpbf16128_mask2: ; CHECK: # %bb.0: -; CHECK-NEXT: vcmpeqpbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x00] +; CHECK-NEXT: vcmpeqbf16 %xmm1, %xmm0, %k0 # encoding: [0x62,0xf3,0x7f,0x08,0xc2,0xc1,0x00] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: andb $3, %al # encoding: [0x24,0x03] ; CHECK-NEXT: # kill: def $al killed $al killed $eax @@ -489,10 +489,10 @@ define i8 @test_int_x86_avx10_vcmppbf16128_mask2(<8 x bfloat> %x1, <8 x bfloat> ret i8 %3 } -define <16 x bfloat> @test_sqrt_nepbf16_256(<16 x bfloat> %a0) { -; CHECK-LABEL: test_sqrt_nepbf16_256: +define <16 x bfloat> @test_sqrt_bf16_256(<16 x bfloat> %a0) { +; CHECK-LABEL: test_sqrt_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vsqrtnepbf16 %ymm0, %ymm0 # encoding: 
[0x62,0xf5,0x7d,0x28,0x51,0xc0] +; CHECK-NEXT: vsqrtbf16 %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x51,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %1 = tail call <16 x bfloat> @llvm.sqrt.v16bf16(<16 x bfloat> %a0) ret <16 x bfloat> %1 @@ -502,13 +502,13 @@ define <16 x bfloat> @test_mm256_mask_sqrt_pbh(<16 x bfloat> %__W, i16 %__U, <16 ; X64-LABEL: test_mm256_mask_sqrt_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsqrtnepbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1] +; X64-NEXT: vsqrtbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask_sqrt_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsqrtnepbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1] +; X86-NEXT: vsqrtbf16 %ymm1, %ymm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x51,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <16 x bfloat> @llvm.sqrt.v16bf16(<16 x bfloat> %__A) @@ -521,13 +521,13 @@ define <16 x bfloat> @test_mm256_maskz_sqrt_pbh(i16 %__U, <16 x bfloat>%__A) { ; X64-LABEL: test_mm256_maskz_sqrt_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsqrtnepbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0] +; X64-NEXT: vsqrtbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_maskz_sqrt_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsqrtnepbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0] +; X86-NEXT: vsqrtbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x51,0xc0] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <16 x bfloat> @llvm.sqrt.v16bf16(<16 
x bfloat> %__A) @@ -536,10 +536,10 @@ entry: ret <16 x bfloat> %2 } -define <8 x bfloat> @test_sqrt_nepbf16_128(<8 x bfloat> %a0) { -; CHECK-LABEL: test_sqrt_nepbf16_128: +define <8 x bfloat> @test_sqrt_bf16_128(<8 x bfloat> %a0) { +; CHECK-LABEL: test_sqrt_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vsqrtnepbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x51,0xc0] +; CHECK-NEXT: vsqrtbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x51,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] %1 = tail call <8 x bfloat> @llvm.sqrt.v8bf16(<8 x bfloat> %a0) ret <8 x bfloat> %1 @@ -549,13 +549,13 @@ define <8 x bfloat> @test_mm_mask_sqrt_pbh(<8 x bfloat> %__W, i8 %__U, <8 x bflo ; X64-LABEL: test_mm_mask_sqrt_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsqrtnepbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1] +; X64-NEXT: vsqrtbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_mask_sqrt_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsqrtnepbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1] +; X86-NEXT: vsqrtbf16 %xmm1, %xmm0 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x51,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <8 x bfloat> @llvm.sqrt.v8bf16(<8 x bfloat> %__A) @@ -568,13 +568,13 @@ define <8 x bfloat> @test_mm_maskz_sqrt_pbh(i8 %__U, <8 x bfloat>%__A) { ; X64-LABEL: test_mm_maskz_sqrt_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vsqrtnepbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0] +; X64-NEXT: vsqrtbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_maskz_sqrt_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # 
encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vsqrtnepbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0] +; X86-NEXT: vsqrtbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x51,0xc0] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <8 x bfloat> @llvm.sqrt.v8bf16(<8 x bfloat> %__A) @@ -586,7 +586,7 @@ entry: define <16 x bfloat> @test_mm256_fmaddne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) { ; CHECK-LABEL: test_mm256_fmaddne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xa8,0xc2] +; CHECK-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xa8,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %0 = tail call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) @@ -597,13 +597,13 @@ define <16 x bfloat> @test_mm256_mask_fmaddne_pbh(<16 x bfloat> %__A, i16 zeroex ; X64-LABEL: test_mm256_mask_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1] +; X64-NEXT: vfmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1] +; X86-NEXT: vfmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x98,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) @@ -616,14 +616,14 @@ define <16 x bfloat> @test_mm256_mask3_fmaddne_pbh(<16 x bfloat> %__A, <16 x bfl ; X64-LABEL: test_mm256_mask3_fmaddne_pbh: ; X64: 
# %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1] +; X64-NEXT: vfmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1] ; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask3_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1] +; X86-NEXT: vfmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xb8,0xd1] ; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -637,13 +637,13 @@ define <16 x bfloat> @test_mm256_maskz_fmaddne_pbh(i16 zeroext %__U, <16 x bfloa ; X64-LABEL: test_mm256_maskz_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2] +; X64-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_maskz_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2] +; X86-NEXT: vfmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xa8,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <16 x bfloat> @llvm.fma.v16bf16(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) @@ -655,7 +655,7 @@ entry: define <16 x bfloat> @test_mm256_fmsubne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> 
%__C) { ; CHECK-LABEL: test_mm256_fmsubne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfmsub213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xaa,0xc2] +; CHECK-NEXT: vfmsub213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xaa,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <16 x bfloat> %__C @@ -667,13 +667,13 @@ define <16 x bfloat> @test_mm256_mask_fmsubne_pbh(<16 x bfloat> %__A, i16 zeroex ; X64-LABEL: test_mm256_mask_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1] +; X64-NEXT: vfmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1] +; X86-NEXT: vfmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9a,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <16 x bfloat> %__C @@ -687,14 +687,14 @@ define <16 x bfloat> @test_mm256_mask3_fmsubne_pbh(<16 x bfloat> %__A, <16 x bfl ; X64-LABEL: test_mm256_mask3_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1] +; X64-NEXT: vfmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1] ; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask3_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub231nepbf16 %ymm1, %ymm0, 
%ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1] +; X86-NEXT: vfmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xba,0xd1] ; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -709,13 +709,13 @@ define <16 x bfloat> @test_mm256_maskz_fmsubne_pbh(i16 zeroext %__U, <16 x bfloa ; X64-LABEL: test_mm256_maskz_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2] +; X64-NEXT: vfmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_maskz_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2] +; X86-NEXT: vfmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xaa,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <16 x bfloat> %__C @@ -728,7 +728,7 @@ entry: define <16 x bfloat> @test_mm256_fnmaddne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) { ; CHECK-LABEL: test_mm256_fnmaddne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfnmadd213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xac,0xc2] +; CHECK-NEXT: vfnmadd213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xac,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <16 x bfloat> %__B @@ -740,13 +740,13 @@ define <16 x bfloat> @test_mm256_mask_fnmaddne_pbh(<16 x bfloat> %__A, i16 zeroe ; X64-LABEL: test_mm256_mask_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: 
[0x62,0xf6,0x6c,0x29,0x9c,0xc1] +; X64-NEXT: vfnmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9c,0xc1] +; X86-NEXT: vfnmadd132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9c,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <16 x bfloat> %__B @@ -760,14 +760,14 @@ define <16 x bfloat> @test_mm256_mask3_fnmaddne_pbh(<16 x bfloat> %__A, <16 x bf ; X64-LABEL: test_mm256_mask3_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1] +; X64-NEXT: vfnmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1] ; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask3_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1] +; X86-NEXT: vfnmadd231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbc,0xd1] ; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -782,13 +782,13 @@ define <16 x bfloat> @test_mm256_maskz_fnmaddne_pbh(i16 zeroext %__U, <16 x bflo ; X64-LABEL: test_mm256_maskz_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2] +; X64-NEXT: 
vfnmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_maskz_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2] +; X86-NEXT: vfnmadd213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xac,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <16 x bfloat> %__B @@ -801,7 +801,7 @@ entry: define <16 x bfloat> @test_mm256_fnmsubne_pbh(<16 x bfloat> %__A, <16 x bfloat> %__B, <16 x bfloat> %__C) { ; CHECK-LABEL: test_mm256_fnmsubne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfnmsub213nepbf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xae,0xc2] +; CHECK-NEXT: vfnmsub213bf16 %ymm2, %ymm1, %ymm0 # encoding: [0x62,0xf6,0x74,0x28,0xae,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <16 x bfloat> %__B @@ -814,13 +814,13 @@ define <16 x bfloat> @test_mm256_mask_fnmsubne_pbh(<16 x bfloat> %__A, i16 zeroe ; X64-LABEL: test_mm256_mask_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1] +; X64-NEXT: vfnmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub132nepbf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1] +; X86-NEXT: vfnmsub132bf16 %ymm1, %ymm2, %ymm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x29,0x9e,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <16 x bfloat> %__B @@ -835,14 +835,14 @@ define <16 x bfloat> 
@test_mm256_mask3_fnmsubne_pbh(<16 x bfloat> %__A, <16 x bf ; X64-LABEL: test_mm256_mask3_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1] +; X64-NEXT: vfnmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1] ; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_mask3_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub231nepbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1] +; X86-NEXT: vfnmsub231bf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0xbe,0xd1] ; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -858,13 +858,13 @@ define <16 x bfloat> @test_mm256_maskz_fnmsubne_pbh(i16 zeroext %__U, <16 x bflo ; X64-LABEL: test_mm256_maskz_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2] +; X64-NEXT: vfnmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm256_maskz_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub213nepbf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2] +; X86-NEXT: vfnmsub213bf16 %ymm2, %ymm1, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0xa9,0xae,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <16 x bfloat> %__B @@ -878,7 +878,7 @@ entry: define <8 x bfloat> @test_mm_fmaddne_pbh(<8 x 
bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) { ; CHECK-LABEL: test_mm_fmaddne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xa8,0xc2] +; CHECK-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xa8,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %0 = tail call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) @@ -889,13 +889,13 @@ define <8 x bfloat> @test_mm_mask_fmaddne_pbh(<8 x bfloat> %__A, i8 zeroext %__U ; X64-LABEL: test_mm_mask_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1] +; X64-NEXT: vfmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_mask_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1] +; X86-NEXT: vfmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x98,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) @@ -908,14 +908,14 @@ define <8 x bfloat> @test_mm_mask3_fmaddne_pbh(<8 x bfloat> %__A, <8 x bfloat> % ; X64-LABEL: test_mm_mask3_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1] +; X64-NEXT: vfmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1] ; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: 
test_mm_mask3_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1] +; X86-NEXT: vfmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xb8,0xd1] ; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -929,13 +929,13 @@ define <8 x bfloat> @test_mm_maskz_fmaddne_pbh(i8 zeroext %__U, <8 x bfloat> %__ ; X64-LABEL: test_mm_maskz_fmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2] +; X64-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_maskz_fmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2] +; X86-NEXT: vfmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xa8,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %0 = tail call <8 x bfloat> @llvm.fma.v8bf16(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) @@ -947,7 +947,7 @@ entry: define <8 x bfloat> @test_mm_fmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) { ; CHECK-LABEL: test_mm_fmsubne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfmsub213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xaa,0xc2] +; CHECK-NEXT: vfmsub213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xaa,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <8 x bfloat> %__C @@ -959,13 +959,13 @@ define <8 x bfloat> @test_mm_mask_fmsubne_pbh(<8 x bfloat> %__A, i8 
zeroext %__U ; X64-LABEL: test_mm_mask_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1] +; X64-NEXT: vfmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_mask_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1] +; X86-NEXT: vfmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9a,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <8 x bfloat> %__C @@ -979,14 +979,14 @@ define <8 x bfloat> @test_mm_mask3_fmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat> % ; X64-LABEL: test_mm_mask3_fmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1] +; X64-NEXT: vfmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1] ; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_mask3_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1] +; X86-NEXT: vfmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xba,0xd1] ; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -1001,13 +1001,13 @@ define <8 x bfloat> @test_mm_maskz_fmsubne_pbh(i8 zeroext %__U, <8 x bfloat> %__ ; X64-LABEL: test_mm_maskz_fmsubne_pbh: ; X64: # %bb.0: # 
%entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2] +; X64-NEXT: vfmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_maskz_fmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2] +; X86-NEXT: vfmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xaa,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <8 x bfloat> %__C @@ -1020,7 +1020,7 @@ entry: define <8 x bfloat> @test_mm_fnmaddne_pbh(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) { ; CHECK-LABEL: test_mm_fnmaddne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfnmadd213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xac,0xc2] +; CHECK-NEXT: vfnmadd213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xac,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <8 x bfloat> %__B @@ -1032,13 +1032,13 @@ define <8 x bfloat> @test_mm_mask_fnmaddne_pbh(<8 x bfloat> %__A, i8 zeroext %__ ; X64-LABEL: test_mm_mask_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9c,0xc1] +; X64-NEXT: vfnmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_mask_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9c,0xc1] +; X86-NEXT: vfnmadd132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: 
[0x62,0xf6,0x6c,0x09,0x9c,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <8 x bfloat> %__B @@ -1052,14 +1052,14 @@ define <8 x bfloat> @test_mm_mask3_fnmaddne_pbh(<8 x bfloat> %__A, <8 x bfloat> ; X64-LABEL: test_mm_mask3_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1] +; X64-NEXT: vfnmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1] ; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_mask3_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1] +; X86-NEXT: vfnmadd231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbc,0xd1] ; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -1074,13 +1074,13 @@ define <8 x bfloat> @test_mm_maskz_fnmaddne_pbh(i8 zeroext %__U, <8 x bfloat> %_ ; X64-LABEL: test_mm_maskz_fnmaddne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2] +; X64-NEXT: vfnmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_maskz_fnmaddne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmadd213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2] +; X86-NEXT: vfnmadd213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xac,0xc2] ; X86-NEXT: 
retl # encoding: [0xc3] entry: %fneg.i.i = fneg <8 x bfloat> %__B @@ -1093,7 +1093,7 @@ entry: define <8 x bfloat> @test_mm_fnmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat> %__B, <8 x bfloat> %__C) { ; CHECK-LABEL: test_mm_fnmsubne_pbh: ; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vfnmsub213nepbf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xae,0xc2] +; CHECK-NEXT: vfnmsub213bf16 %xmm2, %xmm1, %xmm0 # encoding: [0x62,0xf6,0x74,0x08,0xae,0xc2] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] entry: %fneg.i = fneg <8 x bfloat> %__B @@ -1106,13 +1106,13 @@ define <8 x bfloat> @test_mm_mask_fnmsubne_pbh(<8 x bfloat> %__A, i8 zeroext %__ ; X64-LABEL: test_mm_mask_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1] +; X64-NEXT: vfnmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_mask_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub132nepbf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1] +; X86-NEXT: vfnmsub132bf16 %xmm1, %xmm2, %xmm0 {%k1} # encoding: [0x62,0xf6,0x6c,0x09,0x9e,0xc1] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <8 x bfloat> %__B @@ -1127,14 +1127,14 @@ define <8 x bfloat> @test_mm_mask3_fnmsubne_pbh(<8 x bfloat> %__A, <8 x bfloat> ; X64-LABEL: test_mm_mask3_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1] +; X64-NEXT: vfnmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1] ; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; 
X86-LABEL: test_mm_mask3_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub231nepbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1] +; X86-NEXT: vfnmsub231bf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0xbe,0xd1] ; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: @@ -1150,13 +1150,13 @@ define <8 x bfloat> @test_mm_maskz_fnmsubne_pbh(i8 zeroext %__U, <8 x bfloat> %_ ; X64-LABEL: test_mm_maskz_fnmsubne_pbh: ; X64: # %bb.0: # %entry ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vfnmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2] +; X64-NEXT: vfnmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: test_mm_maskz_fnmsubne_pbh: ; X86: # %bb.0: # %entry ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vfnmsub213nepbf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2] +; X86-NEXT: vfnmsub213bf16 %xmm2, %xmm1, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x74,0x89,0xae,0xc2] ; X86-NEXT: retl # encoding: [0xc3] entry: %fneg.i.i = fneg <8 x bfloat> %__B @@ -1170,8 +1170,8 @@ entry: define <32 x bfloat> @addv(<32 x bfloat> %a, <32 x bfloat> %b) nounwind { ; X64-LABEL: addv: ; X64: # %bb.0: -; X64-NEXT: vaddnepbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2] -; X64-NEXT: vaddnepbf16 %ymm3, %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xcb] +; X64-NEXT: vaddbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2] +; X64-NEXT: vaddbf16 %ymm3, %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xcb] ; X64-NEXT: retq # encoding: [0xc3] ; ; X86-LABEL: addv: @@ -1180,8 +1180,8 @@ define <32 x bfloat> @addv(<32 x 
bfloat> %a, <32 x bfloat> %b) nounwind { ; X86-NEXT: movl %esp, %ebp # encoding: [0x89,0xe5] ; X86-NEXT: andl $-32, %esp # encoding: [0x83,0xe4,0xe0] ; X86-NEXT: subl $32, %esp # encoding: [0x83,0xec,0x20] -; X86-NEXT: vaddnepbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2] -; X86-NEXT: vaddnepbf16 8(%ebp), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0x8d,0x08,0x00,0x00,0x00] +; X86-NEXT: vaddbf16 %ymm2, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x58,0xc2] +; X86-NEXT: vaddbf16 8(%ebp), %ymm1, %ymm1 # encoding: [0x62,0xf5,0x75,0x28,0x58,0x8d,0x08,0x00,0x00,0x00] ; X86-NEXT: movl %ebp, %esp # encoding: [0x89,0xec] ; X86-NEXT: popl %ebp # encoding: [0x5d] ; X86-NEXT: retl # encoding: [0xc3] diff --git a/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll b/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll index 59151d4dd9609..f1146d5617f77 100644 --- a/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll +++ b/llvm/test/CodeGen/X86/avx10_2bf16-intrinsics.ll @@ -2,118 +2,118 @@ ; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X64 ; RUN: llc < %s -verify-machineinstrs -mtriple=i686-unknown-unknown --show-mc-encoding -mattr=+avx10.2-256 | FileCheck %s --check-prefixes=CHECK,X86 -declare <16 x bfloat> @llvm.x86.avx10.vminpbf16256(<16 x bfloat>, <16 x bfloat>) +declare <16 x bfloat> @llvm.x86.avx10.vminbf16256(<16 x bfloat>, <16 x bfloat>) -define <16 x bfloat> @test_int_x86_avx10_min_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_min_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_min_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_min_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vminpbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5d,0xc1] +; CHECK-NEXT: vminbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5d,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # 
encoding: [0xc3] - %res0 = call <16 x bfloat> @llvm.x86.avx10.vminpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) + %res0 = call <16 x bfloat> @llvm.x86.avx10.vminbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) ret <16 x bfloat> %res0 } -define <16 x bfloat> @test_int_x86_avx10_maskz_min_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) { -; X64-LABEL: test_int_x86_avx10_maskz_min_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_maskz_min_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) { +; X64-LABEL: test_int_x86_avx10_maskz_min_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vminpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1] +; X64-NEXT: vminbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_min_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_maskz_min_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vminpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1] +; X86-NEXT: vminbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5d,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk to <16 x i1> - %res0 = call <16 x bfloat> @llvm.x86.avx10.vminpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) + %res0 = call <16 x bfloat> @llvm.x86.avx10.vminbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) %res1 = select <16 x i1> %mask, <16 x bfloat> %res0, <16 x bfloat> zeroinitializer ret <16 x bfloat> %res1 } -declare <8 x bfloat> @llvm.x86.avx10.vminpbf16128(<8 x bfloat>, <8 x bfloat>) +declare <8 x bfloat> @llvm.x86.avx10.vminbf16128(<8 x bfloat>, <8 x bfloat>) -define <8 x bfloat> @test_int_x86_avx10_min_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_min_nepbf16_128: +define <8 x bfloat> 
@test_int_x86_avx10_min_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_min_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vminpbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5d,0xc1] +; CHECK-NEXT: vminbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5d,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res0 = call <8 x bfloat> @llvm.x86.avx10.vminpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) + %res0 = call <8 x bfloat> @llvm.x86.avx10.vminbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) ret <8 x bfloat> %res0 } -define <8 x bfloat> @test_int_x86_avx10_maskz_min_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) { -; X64-LABEL: test_int_x86_avx10_maskz_min_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_maskz_min_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) { +; X64-LABEL: test_int_x86_avx10_maskz_min_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vminpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1] +; X64-NEXT: vminbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_min_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_maskz_min_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vminpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1] +; X86-NEXT: vminbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5d,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> - %res0 = call <8 x bfloat> @llvm.x86.avx10.vminpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) + %res0 = call <8 x bfloat> @llvm.x86.avx10.vminbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) %res1 = select <8 x i1> %mask, <8 x bfloat> %res0, <8 x bfloat> zeroinitializer ret <8 x bfloat> %res1 } -declare <16 x bfloat> 
@llvm.x86.avx10.vmaxpbf16256(<16 x bfloat>, <16 x bfloat>) +declare <16 x bfloat> @llvm.x86.avx10.vmaxbf16256(<16 x bfloat>, <16 x bfloat>) -define <16 x bfloat> @test_int_x86_avx10_max_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_max_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_max_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_max_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vmaxpbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5f,0xc1] +; CHECK-NEXT: vmaxbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x5f,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) + %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) ret <16 x bfloat> %res0 } -define <16 x bfloat> @test_int_x86_avx10_maskz_max_nepbf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) { -; X64-LABEL: test_int_x86_avx10_maskz_max_nepbf16_256: +define <16 x bfloat> @test_int_x86_avx10_maskz_max_bf16_256(<16 x bfloat> %x1, <16 x bfloat> %x2, i16 %msk) { +; X64-LABEL: test_int_x86_avx10_maskz_max_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmaxpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1] +; X64-NEXT: vmaxbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_max_nepbf16_256: +; X86-LABEL: test_int_x86_avx10_maskz_max_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmaxpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1] +; X86-NEXT: vmaxbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x5f,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %msk 
to <16 x i1> - %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxpbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) + %res0 = call <16 x bfloat> @llvm.x86.avx10.vmaxbf16256(<16 x bfloat> %x1, <16 x bfloat> %x2) %res1 = select <16 x i1> %mask, <16 x bfloat> %res0, <16 x bfloat> zeroinitializer ret <16 x bfloat> %res1 } -declare <8 x bfloat> @llvm.x86.avx10.vmaxpbf16128(<8 x bfloat>, <8 x bfloat>) +declare <8 x bfloat> @llvm.x86.avx10.vmaxbf16128(<8 x bfloat>, <8 x bfloat>) -define <8 x bfloat> @test_int_x86_avx10_max_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { -; CHECK-LABEL: test_int_x86_avx10_max_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_max_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2) { +; CHECK-LABEL: test_int_x86_avx10_max_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vmaxpbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5f,0xc1] +; CHECK-NEXT: vmaxbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x5f,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) + %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) ret <8 x bfloat> %res0 } -define <8 x bfloat> @test_int_x86_avx10_maskz_max_nepbf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) { -; X64-LABEL: test_int_x86_avx10_maskz_max_nepbf16_128: +define <8 x bfloat> @test_int_x86_avx10_maskz_max_bf16_128(<8 x bfloat> %x1, <8 x bfloat> %x2, i8 %msk) { +; X64-LABEL: test_int_x86_avx10_maskz_max_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vmaxpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1] +; X64-NEXT: vmaxbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx10_maskz_max_nepbf16_128: +; X86-LABEL: test_int_x86_avx10_maskz_max_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb 
{{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vmaxpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1] +; X86-NEXT: vmaxbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x5f,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %msk to <8 x i1> - %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxpbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) + %res0 = call <8 x bfloat> @llvm.x86.avx10.vmaxbf16128(<8 x bfloat> %x1, <8 x bfloat> %x2) %res1 = select <8 x i1> %mask, <8 x bfloat> %res0, <8 x bfloat> zeroinitializer ret <8 x bfloat> %res1 } @@ -184,421 +184,421 @@ define i32 @test_x86_avx10_com_nesbf16_neq(<8 x bfloat> %a0, <8 x bfloat> %a1) { ret i32 %res } -declare <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.128(<8 x bfloat>, <8 x bfloat>, i8) -declare <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.256(<16 x bfloat>, <16 x bfloat>, i16) +declare <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.128(<8 x bfloat>, <8 x bfloat>, i8) +declare <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.256(<16 x bfloat>, <16 x bfloat>, i16) -define <8 x bfloat> @test_rsqrt_nepbf16_128(<8 x bfloat> %a0) { -; CHECK-LABEL: test_rsqrt_nepbf16_128: +define <8 x bfloat> @test_rsqrt_bf16_128(<8 x bfloat> %a0) { +; CHECK-LABEL: test_rsqrt_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vrsqrtpbf16 %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xc0] +; CHECK-NEXT: vrsqrtbf16 %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.128(<8 x bfloat> %a0, <8 x bfloat> zeroinitializer, i8 -1) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.128(<8 x bfloat> %a0, <8 x bfloat> zeroinitializer, i8 -1) ret <8 x bfloat> %res } -define <16 x bfloat> @test_rsqrt_nepbf16_256(<16 x bfloat> %a0) { -; CHECK-LABEL: test_rsqrt_nepbf16_256: +define <16 x bfloat> @test_rsqrt_bf16_256(<16 x bfloat> %a0) { +; CHECK-LABEL: 
test_rsqrt_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vrsqrtpbf16 %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xc0] +; CHECK-NEXT: vrsqrtbf16 %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.nepbf16.256(<16 x bfloat> %a0, <16 x bfloat> zeroinitializer, i16 -1) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.rsqrt.bf16.256(<16 x bfloat> %a0, <16 x bfloat> zeroinitializer, i16 -1) ret <16 x bfloat> %res } -declare <8 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.128(<8 x bfloat>, <8 x bfloat>, i8) -declare <16 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.256(<16 x bfloat>, <16 x bfloat>, i16) +declare <8 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.128(<8 x bfloat>, <8 x bfloat>, i8) +declare <16 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.256(<16 x bfloat>, <16 x bfloat>, i16) -define <8 x bfloat> @test_rcp_nepbf16_128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask) { -; X64-LABEL: test_rcp_nepbf16_128: +define <8 x bfloat> @test_rcp_bf16_128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask) { +; X64-LABEL: test_rcp_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vrcppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8] +; X64-NEXT: vrcpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8] ; X64-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_rcp_nepbf16_128: +; X86-LABEL: test_rcp_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vrcppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8] +; X86-NEXT: vrcpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x4c,0xc8] ; X86-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <8 
x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.128(<8 x bfloat> %a0, <8 x bfloat> %a1, i8 %mask) ret <8 x bfloat> %res } -define <16 x bfloat> @test_rcp_nepbf16_256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask) { -; X64-LABEL: test_rcp_nepbf16_256: +define <16 x bfloat> @test_rcp_bf16_256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask) { +; X64-LABEL: test_rcp_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vrcppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8] +; X64-NEXT: vrcpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8] ; X64-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_rcp_nepbf16_256: +; X86-LABEL: test_rcp_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vrcppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8] +; X86-NEXT: vrcpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x4c,0xc8] ; X86-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.rcp.nepbf16.256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.rcp.bf16.256(<16 x bfloat> %a0, <16 x bfloat> %a1, i16 %mask) ret <16 x bfloat> %res } -declare <8 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8) -declare <16 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16) +declare <8 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8) +declare <16 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16) -define <8 x 
bfloat>@test_int_x86_avx512_mask_reduce_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_mask_reduce_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_reduce_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vreducenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08] -; X64-NEXT: vreducenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] +; X64-NEXT: vreducebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08] +; X64-NEXT: vreducebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04] +; X64-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_128: +; X86-LABEL: test_int_x86_avx512_mask_reduce_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vreducenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08] -; X86-NEXT: vreducenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] +; X86-NEXT: vreducebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x56,0xc8,0x08] +; X86-NEXT: vreducebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x56,0xc0,0x04] +; X86-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3) - %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.128(<8 x 
bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3) + %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1) %res2 = fadd <8 x bfloat> %res, %res1 ret <8 x bfloat> %res2 } -define <16 x bfloat>@test_int_x86_avx512_mask_reduce_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_mask_reduce_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_reduce_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vreducenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08] -; X64-NEXT: vreducenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] +; X64-NEXT: vreducebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08] +; X64-NEXT: vreducebf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04] +; X64-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_reduce_nepbf16_256: +; X86-LABEL: test_int_x86_avx512_mask_reduce_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vreducenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08] -; X86-NEXT: vreducenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] +; X86-NEXT: vreducebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x56,0xc8,0x08] +; X86-NEXT: vreducebf16 $4, %ymm0, %ymm0 # 
encoding: [0x62,0xf3,0x7f,0x28,0x56,0xc0,0x04] +; X86-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3) - %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.nepbf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3) + %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.reduce.bf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1) %res2 = fadd <16 x bfloat> %res, %res1 ret <16 x bfloat> %res2 } -declare <8 x i1> @llvm.x86.avx10.fpclass.nepbf16.128(<8 x bfloat>, i32) -declare <16 x i1> @llvm.x86.avx10.fpclass.nepbf16.256(<16 x bfloat>, i32) +declare <8 x i1> @llvm.x86.avx10.fpclass.bf16.128(<8 x bfloat>, i32) +declare <16 x i1> @llvm.x86.avx10.fpclass.bf16.256(<16 x bfloat>, i32) -define i8 @test_int_x86_avx512_fpclass_nepbf16_128(<8 x bfloat> %x0) { -; CHECK-LABEL: test_int_x86_avx512_fpclass_nepbf16_128: +define i8 @test_int_x86_avx512_fpclass_bf16_128(<8 x bfloat> %x0) { +; CHECK-LABEL: test_int_x86_avx512_fpclass_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vfpclasspbf16 $2, %xmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x08,0x66,0xc8,0x02] +; CHECK-NEXT: vfpclassbf16 $2, %xmm0, %k1 # encoding: [0x62,0xf3,0x7f,0x08,0x66,0xc8,0x02] ; CHECK-NEXT: # k1 = isPositiveZero(xmm0) -; CHECK-NEXT: vfpclasspbf16 $4, %xmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x66,0xc0,0x04] +; CHECK-NEXT: vfpclassbf16 $4, %xmm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x66,0xc0,0x04] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: # kill: def $al killed $al killed $eax ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <8 x i1> @llvm.x86.avx10.fpclass.nepbf16.128(<8 x bfloat> %x0, i32 4) - %res1 = call <8 x i1> 
@llvm.x86.avx10.fpclass.nepbf16.128(<8 x bfloat> %x0, i32 2) + %res = call <8 x i1> @llvm.x86.avx10.fpclass.bf16.128(<8 x bfloat> %x0, i32 4) + %res1 = call <8 x i1> @llvm.x86.avx10.fpclass.bf16.128(<8 x bfloat> %x0, i32 2) %1 = and <8 x i1> %res1, %res %2 = bitcast <8 x i1> %1 to i8 ret i8 %2 } -define i16 @test_int_x86_avx512_fpclass_nepbf16_256(<16 x bfloat> %x0) { -; CHECK-LABEL: test_int_x86_avx512_fpclass_nepbf16_256: +define i16 @test_int_x86_avx512_fpclass_bf16_256(<16 x bfloat> %x0) { +; CHECK-LABEL: test_int_x86_avx512_fpclass_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vfpclasspbf16 $2, %ymm0, %k1 # encoding: [0x62,0xf3,0x7f,0x28,0x66,0xc8,0x02] +; CHECK-NEXT: vfpclassbf16 $2, %ymm0, %k1 # encoding: [0x62,0xf3,0x7f,0x28,0x66,0xc8,0x02] ; CHECK-NEXT: # k1 = isPositiveZero(ymm0) -; CHECK-NEXT: vfpclasspbf16 $4, %ymm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x66,0xc0,0x04] +; CHECK-NEXT: vfpclassbf16 $4, %ymm0, %k0 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x66,0xc0,0x04] ; CHECK-NEXT: kmovd %k0, %eax # encoding: [0xc5,0xfb,0x93,0xc0] ; CHECK-NEXT: # kill: def $ax killed $ax killed $eax ; CHECK-NEXT: vzeroupper # encoding: [0xc5,0xf8,0x77] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <16 x i1> @llvm.x86.avx10.fpclass.nepbf16.256(<16 x bfloat> %x0, i32 4) - %res1 = call <16 x i1> @llvm.x86.avx10.fpclass.nepbf16.256(<16 x bfloat> %x0, i32 2) + %res = call <16 x i1> @llvm.x86.avx10.fpclass.bf16.256(<16 x bfloat> %x0, i32 4) + %res1 = call <16 x i1> @llvm.x86.avx10.fpclass.bf16.256(<16 x bfloat> %x0, i32 2) %1 = and <16 x i1> %res1, %res %2 = bitcast <16 x i1> %1 to i16 ret i16 %2 } -declare <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat>, <8 x bfloat>, i8) -declare <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat>, <16 x bfloat>, i16) +declare <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat>, <8 x bfloat>, i8) +declare <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat>, <16 x 
bfloat>, i16) -define <8 x bfloat>@test_int_x86_avx512_getexp_nepbf16_128(<8 x bfloat> %x0) { -; CHECK-LABEL: test_int_x86_avx512_getexp_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_getexp_bf16_128(<8 x bfloat> %x0) { +; CHECK-LABEL: test_int_x86_avx512_getexp_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vgetexppbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x42,0xc0] +; CHECK-NEXT: vgetexpbf16 %xmm0, %xmm0 # encoding: [0x62,0xf5,0x7d,0x08,0x42,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 -1) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 -1) ret <8 x bfloat> %res } -define <8 x bfloat>@test_int_x86_avx512_mask_getexp_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2) { -; X64-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_mask_getexp_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2) { +; X64-LABEL: test_int_x86_avx512_mask_getexp_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetexppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8] +; X64-NEXT: vgetexpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8] ; X64-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_128: +; X86-LABEL: test_int_x86_avx512_mask_getexp_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetexppbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8] +; X86-NEXT: vgetexpbf16 %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x09,0x42,0xc8] ; X86-NEXT: vmovaps %xmm1, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc1] ; X86-NEXT: retl # 
encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x2) ret <8 x bfloat> %res } -define <8 x bfloat>@test_int_x86_avx512_maskz_getexp_nepbf16_128(<8 x bfloat> %x0, i8 %x2) { -; X64-LABEL: test_int_x86_avx512_maskz_getexp_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_maskz_getexp_bf16_128(<8 x bfloat> %x0, i8 %x2) { +; X64-LABEL: test_int_x86_avx512_maskz_getexp_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetexppbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0] +; X64-NEXT: vgetexpbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_maskz_getexp_nepbf16_128: +; X86-LABEL: test_int_x86_avx512_maskz_getexp_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetexppbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0] +; X86-NEXT: vgetexpbf16 %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0x89,0x42,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 %x2) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.128(<8 x bfloat> %x0, <8 x bfloat> zeroinitializer, i8 %x2) ret <8 x bfloat> %res } -define <16 x bfloat>@test_int_x86_avx512_getexp_nepbf16_256(<16 x bfloat> %x0) { -; CHECK-LABEL: test_int_x86_avx512_getexp_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_getexp_bf16_256(<16 x bfloat> %x0) { +; CHECK-LABEL: test_int_x86_avx512_getexp_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vgetexppbf16 %ymm0, %ymm0 # encoding: [0x62,0xf5,0x7d,0x28,0x42,0xc0] +; CHECK-NEXT: vgetexpbf16 %ymm0, %ymm0 # encoding: 
[0x62,0xf5,0x7d,0x28,0x42,0xc0] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 -1) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 -1) ret <16 x bfloat> %res } -define <16 x bfloat>@test_int_x86_avx512_mask_getexp_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2) { -; X64-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_mask_getexp_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2) { +; X64-LABEL: test_int_x86_avx512_mask_getexp_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetexppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8] +; X64-NEXT: vgetexpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8] ; X64-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_getexp_nepbf16_256: +; X86-LABEL: test_int_x86_avx512_mask_getexp_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetexppbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8] +; X86-NEXT: vgetexpbf16 %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf5,0x7d,0x29,0x42,0xc8] ; X86-NEXT: vmovaps %ymm1, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc1] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x2) ret <16 x bfloat> %res } -define <16 x bfloat>@test_int_x86_avx512_maskz_getexp_nepbf16_256(<16 x bfloat> %x0, i16 %x2) { -; X64-LABEL: 
test_int_x86_avx512_maskz_getexp_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_maskz_getexp_bf16_256(<16 x bfloat> %x0, i16 %x2) { +; X64-LABEL: test_int_x86_avx512_maskz_getexp_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetexppbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0] +; X64-NEXT: vgetexpbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_maskz_getexp_nepbf16_256: +; X86-LABEL: test_int_x86_avx512_maskz_getexp_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetexppbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0] +; X86-NEXT: vgetexpbf16 %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7d,0xa9,0x42,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 %x2) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.getexp.bf16.256(<16 x bfloat> %x0, <16 x bfloat> zeroinitializer, i16 %x2) ret <16 x bfloat> %res } -declare <8 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8) -declare <16 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16) +declare <8 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8) +declare <16 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16) -define <8 x bfloat>@test_int_x86_avx512_mask_getmant_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_mask_getmant_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_getmant_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # 
encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetmantpbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08] -; X64-NEXT: vgetmantpbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] +; X64-NEXT: vgetmantbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08] +; X64-NEXT: vgetmantbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04] +; X64-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_128: +; X86-LABEL: test_int_x86_avx512_mask_getmant_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetmantpbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08] -; X86-NEXT: vgetmantpbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] +; X86-NEXT: vgetmantbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x26,0xc8,0x08] +; X86-NEXT: vgetmantbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x26,0xc0,0x04] +; X86-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3) - %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3) + %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1) %res2 = fadd <8 x bfloat> %res, %res1 ret <8 x bfloat> %res2 } -define <16 x 
bfloat>@test_int_x86_avx512_mask_getmant_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_mask_getmant_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_getmant_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vgetmantpbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08] -; X64-NEXT: vgetmantpbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] +; X64-NEXT: vgetmantbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08] +; X64-NEXT: vgetmantbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04] +; X64-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_getmant_nepbf16_256: +; X86-LABEL: test_int_x86_avx512_mask_getmant_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vgetmantpbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08] -; X86-NEXT: vgetmantpbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] +; X86-NEXT: vgetmantbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x26,0xc8,0x08] +; X86-NEXT: vgetmantbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x26,0xc0,0x04] +; X86-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.getmant.nepbf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3) - %res1 = call <16 x bfloat> 
@llvm.x86.avx10.mask.getmant.nepbf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3) + %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.getmant.bf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1) %res2 = fadd <16 x bfloat> %res, %res1 ret <16 x bfloat> %res2 } -declare <8 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8) -declare <16 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16) +declare <8 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.128(<8 x bfloat>, i32, <8 x bfloat>, i8) +declare <16 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.256(<16 x bfloat>, i32, <16 x bfloat>, i16) -define <8 x bfloat>@test_int_x86_avx512_mask_rndscale_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_mask_rndscale_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x2, i8 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_rndscale_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vrndscalenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08] -; X64-NEXT: vrndscalenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] +; X64-NEXT: vrndscalebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08] +; X64-NEXT: vrndscalebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04] +; X64-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_128: +; X86-LABEL: test_int_x86_avx512_mask_rndscale_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), 
%k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vrndscalenepbf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08] -; X86-NEXT: vrndscalenepbf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] +; X86-NEXT: vrndscalebf16 $8, %xmm0, %xmm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x09,0x08,0xc8,0x08] +; X86-NEXT: vrndscalebf16 $4, %xmm0, %xmm0 # encoding: [0x62,0xf3,0x7f,0x08,0x08,0xc0,0x04] +; X86-NEXT: vaddbf16 %xmm0, %xmm1, %xmm0 # encoding: [0x62,0xf5,0x75,0x08,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3) - %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.128(<8 x bfloat> %x0, i32 8, <8 x bfloat> %x2, i8 %x3) + %res1 = call <8 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.128(<8 x bfloat> %x0, i32 4, <8 x bfloat> %x2, i8 -1) %res2 = fadd <8 x bfloat> %res, %res1 ret <8 x bfloat> %res2 } -define <16 x bfloat>@test_int_x86_avx512_mask_rndscale_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_mask_rndscale_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x2, i16 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_rndscale_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vrndscalenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08] -; X64-NEXT: vrndscalenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04] -; X64-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] +; X64-NEXT: vrndscalebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08] 
+; X64-NEXT: vrndscalebf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04] +; X64-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_rndscale_nepbf16_256: +; X86-LABEL: test_int_x86_avx512_mask_rndscale_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vrndscalenepbf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08] -; X86-NEXT: vrndscalenepbf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04] -; X86-NEXT: vaddnepbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] +; X86-NEXT: vrndscalebf16 $8, %ymm0, %ymm1 {%k1} # encoding: [0x62,0xf3,0x7f,0x29,0x08,0xc8,0x08] +; X86-NEXT: vrndscalebf16 $4, %ymm0, %ymm0 # encoding: [0x62,0xf3,0x7f,0x28,0x08,0xc0,0x04] +; X86-NEXT: vaddbf16 %ymm0, %ymm1, %ymm0 # encoding: [0x62,0xf5,0x75,0x28,0x58,0xc0] ; X86-NEXT: retl # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3) - %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.nepbf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.256(<16 x bfloat> %x0, i32 8, <16 x bfloat> %x2, i16 %x3) + %res1 = call <16 x bfloat> @llvm.x86.avx10.mask.rndscale.bf16.256(<16 x bfloat> %x0, i32 4, <16 x bfloat> %x2, i16 -1) %res2 = fadd <16 x bfloat> %res, %res1 ret <16 x bfloat> %res2 } -declare <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat>, <8 x bfloat>, <8 x bfloat>, i8) -declare <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat>, <16 x bfloat>, <16 x bfloat>, i16) +declare <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat>, <8 x bfloat>, <8 x bfloat>, i8) +declare <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat>, <16 x 
bfloat>, <16 x bfloat>, i16) -define <8 x bfloat>@test_int_x86_avx512_scalef_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1) { -; CHECK-LABEL: test_int_x86_avx512_scalef_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_scalef_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1) { +; CHECK-LABEL: test_int_x86_avx512_scalef_bf16_128: ; CHECK: # %bb.0: -; CHECK-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x2c,0xc1] +; CHECK-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm0 # encoding: [0x62,0xf6,0x7c,0x08,0x2c,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 -1) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 -1) ret <8 x bfloat> %res } -define <8 x bfloat>@test_int_x86_avx512_mask_scalef_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_mask_scalef_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_scalef_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1] +; X64-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1] ; X64-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_128: +; X86-LABEL: test_int_x86_avx512_mask_scalef_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1] +; X86-NEXT: vscalefbf16 %xmm1, %xmm0, 
%xmm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x09,0x2c,0xd1] ; X86-NEXT: vmovaps %xmm2, %xmm0 # EVEX TO VEX Compression encoding: [0xc5,0xf8,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %x3 to <8 x i1> - %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> %x2, i8 %x3) ret <8 x bfloat> %res } -define <8 x bfloat>@test_int_x86_avx512_maskz_scalef_nepbf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x3) { -; X64-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_128: +define <8 x bfloat>@test_int_x86_avx512_maskz_scalef_bf16_128(<8 x bfloat> %x0, <8 x bfloat> %x1, i8 %x3) { +; X64-LABEL: test_int_x86_avx512_maskz_scalef_bf16_128: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1] +; X64-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_128: +; X86-LABEL: test_int_x86_avx512_maskz_scalef_bf16_128: ; X86: # %bb.0: ; X86-NEXT: kmovb {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf9,0x90,0x4c,0x24,0x04] -; X86-NEXT: vscalefpbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1] +; X86-NEXT: vscalefbf16 %xmm1, %xmm0, %xmm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0x89,0x2c,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i8 %x3 to <8 x i1> - %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 %x3) + %res = call <8 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.128(<8 x bfloat> %x0, <8 x bfloat> %x1, <8 x bfloat> zeroinitializer, i8 %x3) ret <8 x bfloat> %res } -define <16 x 
bfloat>@test_int_x86_avx512_scalef_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1) { -; CHECK-LABEL: test_int_x86_avx512_scalef_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_scalef_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1) { +; CHECK-LABEL: test_int_x86_avx512_scalef_bf16_256: ; CHECK: # %bb.0: -; CHECK-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x2c,0xc1] +; CHECK-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm0 # encoding: [0x62,0xf6,0x7c,0x28,0x2c,0xc1] ; CHECK-NEXT: ret{{[l|q]}} # encoding: [0xc3] - %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 -1) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 -1) ret <16 x bfloat> %res } -define <16 x bfloat>@test_int_x86_avx512_mask_scalef_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3) { -; X64-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_mask_scalef_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3) { +; X64-LABEL: test_int_x86_avx512_mask_scalef_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1] +; X64-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1] ; X64-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_mask_scalef_nepbf16_256: +; X86-LABEL: test_int_x86_avx512_mask_scalef_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm2 {%k1} # encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1] +; X86-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm2 {%k1} # 
encoding: [0x62,0xf6,0x7c,0x29,0x2c,0xd1] ; X86-NEXT: vmovaps %ymm2, %ymm0 # EVEX TO VEX Compression encoding: [0xc5,0xfc,0x28,0xc2] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %x3 to <16 x i1> - %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> %x2, i16 %x3) ret <16 x bfloat> %res } -define <16 x bfloat>@test_int_x86_avx512_maskz_scalef_nepbf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x3) { -; X64-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_256: +define <16 x bfloat>@test_int_x86_avx512_maskz_scalef_bf16_256(<16 x bfloat> %x0, <16 x bfloat> %x1, i16 %x3) { +; X64-LABEL: test_int_x86_avx512_maskz_scalef_bf16_256: ; X64: # %bb.0: ; X64-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] -; X64-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1] +; X64-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1] ; X64-NEXT: retq # encoding: [0xc3] ; -; X86-LABEL: test_int_x86_avx512_maskz_scalef_nepbf16_256: +; X86-LABEL: test_int_x86_avx512_maskz_scalef_bf16_256: ; X86: # %bb.0: ; X86-NEXT: kmovw {{[0-9]+}}(%esp), %k1 # encoding: [0xc5,0xf8,0x90,0x4c,0x24,0x04] -; X86-NEXT: vscalefpbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1] +; X86-NEXT: vscalefbf16 %ymm1, %ymm0, %ymm0 {%k1} {z} # encoding: [0x62,0xf6,0x7c,0xa9,0x2c,0xc1] ; X86-NEXT: retl # encoding: [0xc3] %mask = bitcast i16 %x3 to <16 x i1> - %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.nepbf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 %x3) + %res = call <16 x bfloat> @llvm.x86.avx10.mask.scalef.bf16.256(<16 x bfloat> %x0, <16 x bfloat> %x1, <16 x bfloat> zeroinitializer, i16 %x3) ret <16 x bfloat> %res } diff --git 
a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt index 8cc53db077e4f..b278f1d46e4d5 100644 --- a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt +++ b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-32.txt @@ -1,208 +1,208 @@ # RUN: llvm-mc --disassemble %s -triple=i386 | FileCheck %s --check-prefixes=ATT # RUN: llvm-mc --disassemble %s -triple=i386 --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL -# ATT: vaddnepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vaddnepbf16 ymm2, ymm3, ymm4 +# ATT: vaddbf16 %ymm4, %ymm3, %ymm2 +# INTEL: vaddbf16 ymm2, ymm3, ymm4 0x62,0xf5,0x65,0x28,0x58,0xd4 -# ATT: vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vaddnepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vaddbf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf5,0x65,0x2f,0x58,0xd4 -# ATT: vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf5,0x65,0xaf,0x58,0xd4 -# ATT: vaddnepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vaddnepbf16 zmm2, zmm3, zmm4 +# ATT: vaddbf16 %zmm4, %zmm3, %zmm2 +# INTEL: vaddbf16 zmm2, zmm3, zmm4 0x62,0xf5,0x65,0x48,0x58,0xd4 -# ATT: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vaddnepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vaddbf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf5,0x65,0x4f,0x58,0xd4 -# ATT: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf5,0x65,0xcf,0x58,0xd4 -# ATT: vaddnepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vaddnepbf16 xmm2, xmm3, xmm4 +# ATT: vaddbf16 %xmm4, %xmm3, %xmm2 +# INTEL: vaddbf16 xmm2, xmm3, xmm4 0x62,0xf5,0x65,0x08,0x58,0xd4 -# ATT: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vaddnepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} +# 
INTEL: vaddbf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf5,0x65,0x0f,0x58,0xd4 -# ATT: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf5,0x65,0x8f,0x58,0xd4 -# ATT: vaddnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vaddnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vaddbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vaddbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x48,0x58,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vaddnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vaddnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vaddbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vaddbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x4f,0x58,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vaddnepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vaddnepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vaddbf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vaddbf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf5,0x65,0x58,0x58,0x10 -# ATT: vaddnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vaddnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vaddbf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vaddbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x65,0x48,0x58,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vaddnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vaddbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf5,0x65,0xcf,0x58,0x51,0x7f -# ATT: vaddnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vaddnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vaddbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf5,0x65,0xdf,0x58,0x52,0x80 -# ATT: vaddnepbf16 
268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vaddnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vaddbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vaddbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x28,0x58,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vaddnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vaddnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vaddbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vaddbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x2f,0x58,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vaddnepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vaddnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vaddbf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vaddbf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf5,0x65,0x38,0x58,0x10 -# ATT: vaddnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vaddnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vaddbf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vaddbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf5,0x65,0x28,0x58,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vaddnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vaddbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf5,0x65,0xaf,0x58,0x51,0x7f -# ATT: vaddnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vaddnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vaddbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf5,0x65,0xbf,0x58,0x52,0x80 -# ATT: vaddnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vaddnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vaddbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vaddbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x08,0x58,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vaddnepbf16 
291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vaddnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vaddbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vaddbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x0f,0x58,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vaddnepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vaddnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vaddbf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vaddbf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf5,0x65,0x18,0x58,0x10 -# ATT: vaddnepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vaddnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vaddbf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vaddbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x65,0x08,0x58,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vaddnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vaddbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf5,0x65,0x8f,0x58,0x51,0x7f -# ATT: vaddnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vaddnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vaddbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf5,0x65,0x9f,0x58,0x52,0x80 -# ATT: vcmppbf16 $123, %ymm4, %ymm3, %k5 -# INTEL: vcmppbf16 k5, ymm3, ymm4, 123 +# ATT: vcmpbf16 $123, %ymm4, %ymm3, %k5 +# INTEL: vcmpbf16 k5, ymm3, ymm4, 123 0x62,0xf3,0x67,0x28,0xc2,0xec,0x7b -# ATT: vcmppbf16 $123, %ymm4, %ymm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm3, ymm4, 123 +# ATT: vcmpbf16 $123, %ymm4, %ymm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm3, ymm4, 123 0x62,0xf3,0x67,0x2f,0xc2,0xec,0x7b -# ATT: vcmppbf16 $123, %xmm4, %xmm3, %k5 -# INTEL: vcmppbf16 k5, xmm3, xmm4, 123 +# ATT: vcmpbf16 $123, %xmm4, %xmm3, %k5 +# INTEL: vcmpbf16 k5, xmm3, xmm4, 123 0x62,0xf3,0x67,0x08,0xc2,0xec,0x7b -# ATT: vcmppbf16 $123, %xmm4, %xmm3, %k5 
{%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm3, xmm4, 123 +# ATT: vcmpbf16 $123, %xmm4, %xmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm3, xmm4, 123 0x62,0xf3,0x67,0x0f,0xc2,0xec,0x7b -# ATT: vcmppbf16 $123, %zmm4, %zmm3, %k5 -# INTEL: vcmppbf16 k5, zmm3, zmm4, 123 +# ATT: vcmpbf16 $123, %zmm4, %zmm3, %k5 +# INTEL: vcmpbf16 k5, zmm3, zmm4, 123 0x62,0xf3,0x67,0x48,0xc2,0xec,0x7b -# ATT: vcmppbf16 $123, %zmm4, %zmm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm3, zmm4, 123 +# ATT: vcmpbf16 $123, %zmm4, %zmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm3, zmm4, 123 0x62,0xf3,0x67,0x4f,0xc2,0xec,0x7b -# ATT: vcmppbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5 -# INTEL: vcmppbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vcmpbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5 +# INTEL: vcmpbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x67,0x48,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vcmppbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123 +# ATT: vcmpbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x67,0x4f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, (%eax){1to32}, %zmm3, %k5 -# INTEL: vcmppbf16 k5, zmm3, word ptr [eax]{1to32}, 123 +# ATT: vcmpbf16 $123, (%eax){1to32}, %zmm3, %k5 +# INTEL: vcmpbf16 k5, zmm3, word ptr [eax]{1to32}, 123 0x62,0xf3,0x67,0x58,0xc2,0x28,0x7b -# ATT: vcmppbf16 $123, -2048(,%ebp,2), %zmm3, %k5 -# INTEL: vcmppbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123 +# ATT: vcmpbf16 $123, -2048(,%ebp,2), %zmm3, %k5 +# INTEL: vcmpbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123 0x62,0xf3,0x67,0x48,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vcmppbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123 +# ATT: vcmpbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123 
0x62,0xf3,0x67,0x4f,0xc2,0x69,0x7f,0x7b -# ATT: vcmppbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123 +# ATT: vcmpbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123 0x62,0xf3,0x67,0x5f,0xc2,0x6a,0x80,0x7b -# ATT: vcmppbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5 -# INTEL: vcmppbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vcmpbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5 +# INTEL: vcmpbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x67,0x08,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vcmppbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123 +# ATT: vcmpbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x67,0x0f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, (%eax){1to8}, %xmm3, %k5 -# INTEL: vcmppbf16 k5, xmm3, word ptr [eax]{1to8}, 123 +# ATT: vcmpbf16 $123, (%eax){1to8}, %xmm3, %k5 +# INTEL: vcmpbf16 k5, xmm3, word ptr [eax]{1to8}, 123 0x62,0xf3,0x67,0x18,0xc2,0x28,0x7b -# ATT: vcmppbf16 $123, -512(,%ebp,2), %xmm3, %k5 -# INTEL: vcmppbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123 +# ATT: vcmpbf16 $123, -512(,%ebp,2), %xmm3, %k5 +# INTEL: vcmpbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123 0x62,0xf3,0x67,0x08,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vcmppbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123 +# ATT: vcmpbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123 0x62,0xf3,0x67,0x0f,0xc2,0x69,0x7f,0x7b -# ATT: vcmppbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123 +# ATT: vcmpbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm3, word ptr 
[edx - 256]{1to8}, 123 0x62,0xf3,0x67,0x1f,0xc2,0x6a,0x80,0x7b -# ATT: vcmppbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5 -# INTEL: vcmppbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vcmpbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5 +# INTEL: vcmpbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x67,0x28,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vcmppbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123 +# ATT: vcmpbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x67,0x2f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, (%eax){1to16}, %ymm3, %k5 -# INTEL: vcmppbf16 k5, ymm3, word ptr [eax]{1to16}, 123 +# ATT: vcmpbf16 $123, (%eax){1to16}, %ymm3, %k5 +# INTEL: vcmpbf16 k5, ymm3, word ptr [eax]{1to16}, 123 0x62,0xf3,0x67,0x38,0xc2,0x28,0x7b -# ATT: vcmppbf16 $123, -1024(,%ebp,2), %ymm3, %k5 -# INTEL: vcmppbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123 +# ATT: vcmpbf16 $123, -1024(,%ebp,2), %ymm3, %k5 +# INTEL: vcmpbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123 0x62,0xf3,0x67,0x28,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vcmppbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123 +# ATT: vcmpbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123 0x62,0xf3,0x67,0x2f,0xc2,0x69,0x7f,0x7b -# ATT: vcmppbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123 +# ATT: vcmpbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123 0x62,0xf3,0x67,0x3f,0xc2,0x6a,0x80,0x7b # ATT: vcomsbf16 %xmm3, %xmm2 @@ -233,2783 +233,2783 @@ # INTEL: vcomsbf16 xmm2, word ptr [edx - 256] 0x62,0xf5,0x7d,0x08,0x2f,0x52,0x80 -# ATT: vdivnepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: 
vdivnepbf16 ymm2, ymm3, ymm4 +# ATT: vdivbf16 %ymm4, %ymm3, %ymm2 +# INTEL: vdivbf16 ymm2, ymm3, ymm4 0x62,0xf5,0x65,0x28,0x5e,0xd4 -# ATT: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vdivnepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vdivbf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf5,0x65,0x2f,0x5e,0xd4 -# ATT: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf5,0x65,0xaf,0x5e,0xd4 -# ATT: vdivnepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vdivnepbf16 zmm2, zmm3, zmm4 +# ATT: vdivbf16 %zmm4, %zmm3, %zmm2 +# INTEL: vdivbf16 zmm2, zmm3, zmm4 0x62,0xf5,0x65,0x48,0x5e,0xd4 -# ATT: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vdivnepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vdivbf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf5,0x65,0x4f,0x5e,0xd4 -# ATT: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf5,0x65,0xcf,0x5e,0xd4 -# ATT: vdivnepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vdivnepbf16 xmm2, xmm3, xmm4 +# ATT: vdivbf16 %xmm4, %xmm3, %xmm2 +# INTEL: vdivbf16 xmm2, xmm3, xmm4 0x62,0xf5,0x65,0x08,0x5e,0xd4 -# ATT: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vdivnepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vdivbf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf5,0x65,0x0f,0x5e,0xd4 -# ATT: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf5,0x65,0x8f,0x5e,0xd4 -# ATT: vdivnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vdivnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vdivbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vdivbf16 zmm2, zmm3, zmmword ptr [esp 
+ 8*esi + 268435456] 0x62,0xf5,0x65,0x48,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vdivnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vdivnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vdivbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vdivbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x4f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vdivnepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vdivnepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vdivbf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vdivbf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf5,0x65,0x58,0x5e,0x10 -# ATT: vdivnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vdivnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vdivbf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vdivbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x65,0x48,0x5e,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vdivnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vdivbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf5,0x65,0xcf,0x5e,0x51,0x7f -# ATT: vdivnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vdivnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vdivbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf5,0x65,0xdf,0x5e,0x52,0x80 -# ATT: vdivnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vdivnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vdivbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vdivbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x28,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vdivnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vdivnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vdivbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vdivbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 
4*eax + 291] 0x62,0xf5,0x65,0x2f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vdivnepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vdivnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vdivbf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vdivbf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf5,0x65,0x38,0x5e,0x10 -# ATT: vdivnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vdivnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vdivbf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vdivbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf5,0x65,0x28,0x5e,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vdivnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vdivbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf5,0x65,0xaf,0x5e,0x51,0x7f -# ATT: vdivnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vdivnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vdivbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf5,0x65,0xbf,0x5e,0x52,0x80 -# ATT: vdivnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vdivnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vdivbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vdivbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x08,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vdivnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vdivnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vdivbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vdivbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x0f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vdivnepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vdivnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vdivbf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vdivbf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf5,0x65,0x18,0x5e,0x10 -# ATT: vdivnepbf16 
-512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vdivnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vdivbf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vdivbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x65,0x08,0x5e,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vdivnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vdivbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf5,0x65,0x8f,0x5e,0x51,0x7f -# ATT: vdivnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vdivnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vdivbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf5,0x65,0x9f,0x5e,0x52,0x80 -# ATT: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfmadd132nepbf16 ymm2, ymm3, ymm4 +# ATT: vfmadd132bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfmadd132bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0x98,0xd4 -# ATT: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfmadd132nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfmadd132bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0x98,0xd4 -# ATT: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0x98,0xd4 -# ATT: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfmadd132nepbf16 zmm2, zmm3, zmm4 +# ATT: vfmadd132bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfmadd132bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0x98,0xd4 -# ATT: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfmadd132nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfmadd132bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0x98,0xd4 -# ATT: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 zmm2 {k7} {z}, 
zmm3, zmm4 +# ATT: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0x98,0xd4 -# ATT: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfmadd132nepbf16 xmm2, xmm3, xmm4 +# ATT: vfmadd132bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfmadd132bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0x98,0xd4 -# ATT: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfmadd132nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfmadd132bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0x98,0xd4 -# ATT: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0x98,0xd4 -# ATT: vfmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0x98,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0x98,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfmadd132bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0x98,0x10 -# ATT: vfmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 
0x62,0xf6,0x64,0x48,0x98,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0x98,0x51,0x7f -# ATT: vfmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0x98,0x52,0x80 -# ATT: vfmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0x98,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0x98,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfmadd132bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0x98,0x10 -# ATT: vfmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0x98,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: 
vfmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0x98,0x51,0x7f -# ATT: vfmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0x98,0x52,0x80 -# ATT: vfmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0x98,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0x98,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfmadd132bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0x98,0x10 -# ATT: vfmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0x98,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0x98,0x51,0x7f -# ATT: vfmadd132nepbf16 -256(%edx){1to8}, %xmm3, 
%xmm2 {%k7} {z} -# INTEL: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0x98,0x52,0x80 -# ATT: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfmadd213nepbf16 ymm2, ymm3, ymm4 +# ATT: vfmadd213bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfmadd213bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfmadd213bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfmadd213nepbf16 zmm2, zmm3, zmm4 +# ATT: vfmadd213bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfmadd213bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfmadd213bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfmadd213nepbf16 xmm2, xmm3, xmm4 +# ATT: vfmadd213bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfmadd213bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfmadd213bf16 xmm2 {k7}, xmm3, xmm4 
0x62,0xf6,0x64,0x0f,0xa8,0xd4 -# ATT: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xa8,0xd4 -# ATT: vfmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfmadd213bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0xa8,0x10 -# ATT: vfmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xa8,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0xa8,0x51,0x7f -# ATT: vfmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd213bf16 zmm2 {k7} 
{z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xa8,0x52,0x80 -# ATT: vfmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfmadd213bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xa8,0x10 -# ATT: vfmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xa8,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xa8,0x51,0x7f -# ATT: vfmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xa8,0x52,0x80 -# ATT: vfmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 
8*esi + 268435456] +# ATT: vfmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfmadd213bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xa8,0x10 -# ATT: vfmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xa8,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xa8,0x51,0x7f -# ATT: vfmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xa8,0x52,0x80 -# ATT: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfmadd231nepbf16 ymm2, ymm3, ymm4 +# ATT: vfmadd231bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfmadd231bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfmadd231bf16 
%ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfmadd231bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfmadd231nepbf16 zmm2, zmm3, zmm4 +# ATT: vfmadd231bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfmadd231bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfmadd231bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfmadd231nepbf16 xmm2, xmm3, xmm4 +# ATT: vfmadd231bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfmadd231bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfmadd231bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0xb8,0xd4 -# ATT: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xb8,0xd4 -# ATT: vfmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 
0x62,0xf6,0x64,0x48,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfmadd231bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0xb8,0x10 -# ATT: vfmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xb8,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0xb8,0x51,0x7f -# ATT: vfmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xb8,0x52,0x80 -# ATT: vfmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# 
ATT: vfmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfmadd231bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xb8,0x10 -# ATT: vfmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xb8,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xb8,0x51,0x7f -# ATT: vfmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xb8,0x52,0x80 -# ATT: vfmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: 
vfmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfmadd231bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xb8,0x10 -# ATT: vfmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xb8,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xb8,0x51,0x7f -# ATT: vfmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xb8,0x52,0x80 -# ATT: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfmsub132nepbf16 ymm2, ymm3, ymm4 +# ATT: vfmsub132bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfmsub132bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0x9a,0xd4 -# ATT: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfmsub132bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0x9a,0xd4 -# ATT: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0x9a,0xd4 -# ATT: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfmsub132nepbf16 zmm2, zmm3, zmm4 +# ATT: vfmsub132bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfmsub132bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0x9a,0xd4 
-# ATT: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfmsub132bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0x9a,0xd4 -# ATT: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0x9a,0xd4 -# ATT: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfmsub132nepbf16 xmm2, xmm3, xmm4 +# ATT: vfmsub132bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfmsub132bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0x9a,0xd4 -# ATT: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfmsub132bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0x9a,0xd4 -# ATT: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0x9a,0xd4 -# ATT: vfmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfmsub132bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfmsub132bf16 zmm2, zmm3, word ptr 
[eax]{1to32} 0x62,0xf6,0x64,0x58,0x9a,0x10 -# ATT: vfmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0x9a,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0x9a,0x51,0x7f -# ATT: vfmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0x9a,0x52,0x80 -# ATT: vfmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfmsub132bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0x9a,0x10 -# ATT: vfmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfmsub132bf16 
-1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0x9a,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0x9a,0x51,0x7f -# ATT: vfmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0x9a,0x52,0x80 -# ATT: vfmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfmsub132bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0x9a,0x10 -# ATT: vfmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0x9a,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} 
{z} -# INTEL: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0x9a,0x51,0x7f -# ATT: vfmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0x9a,0x52,0x80 -# ATT: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfmsub213nepbf16 ymm2, ymm3, ymm4 +# ATT: vfmsub213bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfmsub213bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfmsub213bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfmsub213nepbf16 zmm2, zmm3, zmm4 +# ATT: vfmsub213bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfmsub213bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfmsub213bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfmsub213nepbf16 xmm2, xmm3, xmm4 +# ATT: vfmsub213bf16 %xmm4, 
%xmm3, %xmm2 +# INTEL: vfmsub213bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfmsub213bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0xaa,0xd4 -# ATT: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xaa,0xd4 -# ATT: vfmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfmsub213bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0xaa,0x10 -# ATT: vfmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xaa,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 
8128] 0x62,0xf6,0x64,0xcf,0xaa,0x51,0x7f -# ATT: vfmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xaa,0x52,0x80 -# ATT: vfmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfmsub213bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xaa,0x10 -# ATT: vfmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xaa,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xaa,0x51,0x7f -# ATT: vfmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: 
vfmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xaa,0x52,0x80 -# ATT: vfmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfmsub213bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xaa,0x10 -# ATT: vfmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xaa,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xaa,0x51,0x7f -# ATT: vfmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xaa,0x52,0x80 -# ATT: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 
-# INTEL: vfmsub231nepbf16 ymm2, ymm3, ymm4 +# ATT: vfmsub231bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfmsub231bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xba,0xd4 -# ATT: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfmsub231bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xba,0xd4 -# ATT: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xba,0xd4 -# ATT: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfmsub231nepbf16 zmm2, zmm3, zmm4 +# ATT: vfmsub231bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfmsub231bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xba,0xd4 -# ATT: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfmsub231bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0xba,0xd4 -# ATT: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xba,0xd4 -# ATT: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfmsub231nepbf16 xmm2, xmm3, xmm4 +# ATT: vfmsub231bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfmsub231bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xba,0xd4 -# ATT: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfmsub231nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfmsub231bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0xba,0xd4 -# ATT: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xba,0xd4 -# ATT: vfmsub231nepbf16 
268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0xba,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xba,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfmsub231bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0xba,0x10 -# ATT: vfmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xba,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0xba,0x51,0x7f -# ATT: vfmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xba,0x52,0x80 -# ATT: vfmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfmsub231bf16 
ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xba,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0xba,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfmsub231bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xba,0x10 -# ATT: vfmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xba,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xba,0x51,0x7f -# ATT: vfmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xba,0x52,0x80 -# ATT: vfmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xba,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfmsub231nepbf16 
xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xba,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfmsub231bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xba,0x10 -# ATT: vfmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xba,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xba,0x51,0x7f -# ATT: vfmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xba,0x52,0x80 -# ATT: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfnmadd132nepbf16 ymm2, ymm3, ymm4 +# ATT: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfnmadd132bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfnmadd132bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd132bf16 
ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfnmadd132nepbf16 zmm2, zmm3, zmm4 +# ATT: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfnmadd132bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfnmadd132bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfnmadd132nepbf16 xmm2, xmm3, xmm4 +# ATT: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfnmadd132bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfnmadd132bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0x9c,0xd4 -# ATT: vfnmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfnmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr 
[edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfnmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfnmadd132bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfnmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0x9c,0x10 -# ATT: vfnmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfnmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0x9c,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfnmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0x9c,0x51,0x7f -# ATT: vfnmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfnmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0x9c,0x52,0x80 -# ATT: vfnmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfnmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfnmadd132nepbf16 ymm2, ymm3, 
word ptr [eax]{1to16} +# ATT: vfnmadd132bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfnmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0x9c,0x10 -# ATT: vfnmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfnmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0x9c,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfnmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0x9c,0x51,0x7f -# ATT: vfnmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfnmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0x9c,0x52,0x80 -# ATT: vfnmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfnmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfnmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfnmadd132bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfnmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0x9c,0x10 -# ATT: 
vfnmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfnmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0x9c,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfnmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0x9c,0x51,0x7f -# ATT: vfnmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfnmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0x9c,0x52,0x80 -# ATT: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfnmadd213nepbf16 ymm2, ymm3, ymm4 +# ATT: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfnmadd213bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfnmadd213bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfnmadd213nepbf16 zmm2, zmm3, zmm4 +# ATT: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfnmadd213bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfnmadd213bf16 zmm2 {k7}, zmm3, zmm4 
0x62,0xf6,0x64,0x4f,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfnmadd213nepbf16 xmm2, xmm3, xmm4 +# ATT: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfnmadd213bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfnmadd213bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0xac,0xd4 -# ATT: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xac,0xd4 -# ATT: vfnmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0xac,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfnmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xac,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfnmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfnmadd213bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfnmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0xac,0x10 -# ATT: vfnmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: 
vfnmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xac,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfnmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0xac,0x51,0x7f -# ATT: vfnmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfnmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xac,0x52,0x80 -# ATT: vfnmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xac,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfnmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0xac,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfnmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfnmadd213bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfnmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xac,0x10 -# ATT: vfnmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfnmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xac,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: 
vfnmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfnmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xac,0x51,0x7f -# ATT: vfnmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfnmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xac,0x52,0x80 -# ATT: vfnmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xac,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfnmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xac,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfnmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfnmadd213bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfnmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xac,0x10 -# ATT: vfnmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfnmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xac,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfnmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} 
{z} +# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xac,0x51,0x7f -# ATT: vfnmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfnmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xac,0x52,0x80 -# ATT: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfnmadd231nepbf16 ymm2, ymm3, ymm4 +# ATT: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfnmadd231bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfnmadd231bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfnmadd231nepbf16 zmm2, zmm3, zmm4 +# ATT: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfnmadd231bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfnmadd231bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfnmadd231nepbf16 xmm2, xmm3, xmm4 +# ATT: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfnmadd231bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xbc,0xd4 -# ATT: 
vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfnmadd231bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xbc,0xd4 -# ATT: vfnmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfnmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfnmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfnmadd231bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfnmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0xbc,0x10 -# ATT: vfnmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfnmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xbc,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfnmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0xbc,0x51,0x7f -# ATT: vfnmadd231nepbf16 
-256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfnmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xbc,0x52,0x80 -# ATT: vfnmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfnmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfnmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfnmadd231bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfnmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xbc,0x10 -# ATT: vfnmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfnmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xbc,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfnmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xbc,0x51,0x7f -# ATT: vfnmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfnmadd231bf16 -256(%edx){1to16}, %ymm3, 
%ymm2 {%k7} {z} +# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xbc,0x52,0x80 -# ATT: vfnmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfnmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfnmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfnmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfnmadd231bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfnmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xbc,0x10 -# ATT: vfnmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfnmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xbc,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfnmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xbc,0x51,0x7f -# ATT: vfnmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfnmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xbc,0x52,0x80 -# ATT: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: 
vfnmsub132nepbf16 ymm2, ymm3, ymm4 +# ATT: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfnmsub132bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfnmsub132bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfnmsub132nepbf16 zmm2, zmm3, zmm4 +# ATT: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfnmsub132bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfnmsub132bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfnmsub132nepbf16 xmm2, xmm3, xmm4 +# ATT: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfnmsub132bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfnmsub132bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0x9e,0xd4 -# ATT: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0x9e,0xd4 -# ATT: 
vfnmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfnmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfnmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfnmsub132bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfnmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0x9e,0x10 -# ATT: vfnmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfnmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0x9e,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfnmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0x9e,0x51,0x7f -# ATT: vfnmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfnmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0x9e,0x52,0x80 -# ATT: vfnmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub132bf16 
268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfnmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfnmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfnmsub132bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfnmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0x9e,0x10 -# ATT: vfnmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfnmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0x9e,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfnmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0x9e,0x51,0x7f -# ATT: vfnmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfnmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0x9e,0x52,0x80 -# ATT: vfnmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10 -# 
ATT: vfnmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfnmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfnmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfnmsub132bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfnmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0x9e,0x10 -# ATT: vfnmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfnmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0x9e,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfnmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0x9e,0x51,0x7f -# ATT: vfnmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfnmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0x9e,0x52,0x80 -# ATT: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfnmsub213nepbf16 ymm2, ymm3, ymm4 +# ATT: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfnmsub213bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfnmsub213bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 
ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfnmsub213nepbf16 zmm2, zmm3, zmm4 +# ATT: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfnmsub213bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfnmsub213bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfnmsub213nepbf16 xmm2, xmm3, xmm4 +# ATT: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfnmsub213bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfnmsub213bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0xae,0xd4 -# ATT: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xae,0xd4 -# ATT: vfnmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0xae,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: 
vfnmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfnmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xae,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfnmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfnmsub213bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfnmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0xae,0x10 -# ATT: vfnmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfnmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xae,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfnmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0xae,0x51,0x7f -# ATT: vfnmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfnmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xae,0x52,0x80 -# ATT: vfnmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xae,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfnmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 
0x62,0xf6,0x64,0x2f,0xae,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfnmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfnmsub213bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfnmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xae,0x10 -# ATT: vfnmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vfnmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xae,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfnmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xae,0x51,0x7f -# ATT: vfnmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfnmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xae,0x52,0x80 -# ATT: vfnmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xae,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfnmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xae,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfnmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# 
ATT: vfnmsub213bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfnmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xae,0x10 -# ATT: vfnmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfnmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xae,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfnmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xae,0x51,0x7f -# ATT: vfnmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfnmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xae,0x52,0x80 -# ATT: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vfnmsub231nepbf16 ymm2, ymm3, ymm4 +# ATT: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 +# INTEL: vfnmsub231bf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vfnmsub231bf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vfnmsub231nepbf16 zmm2, zmm3, zmm4 +# ATT: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 +# INTEL: vfnmsub231bf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: 
vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vfnmsub231bf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf6,0x64,0xcf,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vfnmsub231nepbf16 xmm2, xmm3, xmm4 +# ATT: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 +# INTEL: vfnmsub231bf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vfnmsub231bf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0xbe,0xd4 -# ATT: vfnmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vfnmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vfnmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vfnmsub231bf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vfnmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32} 
0x62,0xf6,0x64,0x58,0xbe,0x10 -# ATT: vfnmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vfnmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0xbe,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vfnmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0xbe,0x51,0x7f -# ATT: vfnmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vfnmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0xbe,0x52,0x80 -# ATT: vfnmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vfnmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vfnmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vfnmsub231bf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vfnmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0xbe,0x10 -# ATT: vfnmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: 
vfnmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0xbe,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vfnmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0xbe,0x51,0x7f -# ATT: vfnmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vfnmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0xbe,0x52,0x80 -# ATT: vfnmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vfnmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vfnmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vfnmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vfnmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vfnmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vfnmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vfnmsub231bf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vfnmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0xbe,0x10 -# ATT: vfnmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vfnmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0xbe,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: 
vfnmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vfnmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0xbe,0x51,0x7f -# ATT: vfnmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vfnmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0xbe,0x52,0x80 -# ATT: vfpclasspbf16 $123, %zmm3, %k5 -# INTEL: vfpclasspbf16 k5, zmm3, 123 +# ATT: vfpclassbf16 $123, %zmm3, %k5 +# INTEL: vfpclassbf16 k5, zmm3, 123 0x62,0xf3,0x7f,0x48,0x66,0xeb,0x7b -# ATT: vfpclasspbf16 $123, %zmm3, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, zmm3, 123 +# ATT: vfpclassbf16 $123, %zmm3, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, zmm3, 123 0x62,0xf3,0x7f,0x4f,0x66,0xeb,0x7b -# ATT: vfpclasspbf16 $123, %ymm3, %k5 -# INTEL: vfpclasspbf16 k5, ymm3, 123 +# ATT: vfpclassbf16 $123, %ymm3, %k5 +# INTEL: vfpclassbf16 k5, ymm3, 123 0x62,0xf3,0x7f,0x28,0x66,0xeb,0x7b -# ATT: vfpclasspbf16 $123, %ymm3, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, ymm3, 123 +# ATT: vfpclassbf16 $123, %ymm3, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, ymm3, 123 0x62,0xf3,0x7f,0x2f,0x66,0xeb,0x7b -# ATT: vfpclasspbf16 $123, %xmm3, %k5 -# INTEL: vfpclasspbf16 k5, xmm3, 123 +# ATT: vfpclassbf16 $123, %xmm3, %k5 +# INTEL: vfpclassbf16 k5, xmm3, 123 0x62,0xf3,0x7f,0x08,0x66,0xeb,0x7b -# ATT: vfpclasspbf16 $123, %xmm3, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, xmm3, 123 +# ATT: vfpclassbf16 $123, %xmm3, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, xmm3, 123 0x62,0xf3,0x7f,0x0f,0x66,0xeb,0x7b -# ATT: vfpclasspbf16x $123, 268435456(%esp,%esi,8), %k5 -# INTEL: vfpclasspbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vfpclassbf16x $123, 268435456(%esp,%esi,8), %k5 +# INTEL: 
vfpclassbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x08,0x66,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vfpclasspbf16x $123, 291(%edi,%eax,4), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +# ATT: vfpclassbf16x $123, 291(%edi,%eax,4), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x0f,0x66,0xac,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vfpclasspbf16 $123, (%eax){1to8}, %k5 -# INTEL: vfpclasspbf16 k5, word ptr [eax]{1to8}, 123 +# ATT: vfpclassbf16 $123, (%eax){1to8}, %k5 +# INTEL: vfpclassbf16 k5, word ptr [eax]{1to8}, 123 0x62,0xf3,0x7f,0x18,0x66,0x28,0x7b -# ATT: vfpclasspbf16x $123, -512(,%ebp,2), %k5 -# INTEL: vfpclasspbf16 k5, xmmword ptr [2*ebp - 512], 123 +# ATT: vfpclassbf16x $123, -512(,%ebp,2), %k5 +# INTEL: vfpclassbf16 k5, xmmword ptr [2*ebp - 512], 123 0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vfpclasspbf16x $123, 2032(%ecx), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123 +# ATT: vfpclassbf16x $123, 2032(%ecx), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123 0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b -# ATT: vfpclasspbf16 $123, -256(%edx){1to8}, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123 +# ATT: vfpclassbf16 $123, -256(%edx){1to8}, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123 0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b -# ATT: vfpclasspbf16 $123, (%eax){1to16}, %k5 -# INTEL: vfpclasspbf16 k5, word ptr [eax]{1to16}, 123 +# ATT: vfpclassbf16 $123, (%eax){1to16}, %k5 +# INTEL: vfpclassbf16 k5, word ptr [eax]{1to16}, 123 0x62,0xf3,0x7f,0x38,0x66,0x28,0x7b -# ATT: vfpclasspbf16y $123, -1024(,%ebp,2), %k5 -# INTEL: vfpclasspbf16 k5, ymmword ptr [2*ebp - 1024], 123 +# ATT: vfpclassbf16y $123, -1024(,%ebp,2), %k5 +# INTEL: vfpclassbf16 k5, ymmword ptr [2*ebp - 1024], 123 0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b -# 
ATT: vfpclasspbf16y $123, 4064(%ecx), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123 +# ATT: vfpclassbf16y $123, 4064(%ecx), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123 0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b -# ATT: vfpclasspbf16 $123, -256(%edx){1to16}, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123 +# ATT: vfpclassbf16 $123, -256(%edx){1to16}, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123 0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b -# ATT: vfpclasspbf16 $123, (%eax){1to32}, %k5 -# INTEL: vfpclasspbf16 k5, word ptr [eax]{1to32}, 123 +# ATT: vfpclassbf16 $123, (%eax){1to32}, %k5 +# INTEL: vfpclassbf16 k5, word ptr [eax]{1to32}, 123 0x62,0xf3,0x7f,0x58,0x66,0x28,0x7b -# ATT: vfpclasspbf16z $123, -2048(,%ebp,2), %k5 -# INTEL: vfpclasspbf16 k5, zmmword ptr [2*ebp - 2048], 123 +# ATT: vfpclassbf16z $123, -2048(,%ebp,2), %k5 +# INTEL: vfpclassbf16 k5, zmmword ptr [2*ebp - 2048], 123 0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vfpclasspbf16z $123, 8128(%ecx), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123 +# ATT: vfpclassbf16z $123, 8128(%ecx), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123 0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b -# ATT: vfpclasspbf16 $123, -256(%edx){1to32}, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123 +# ATT: vfpclassbf16 $123, -256(%edx){1to32}, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123 0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b -# ATT: vgetexppbf16 %xmm3, %xmm2 -# INTEL: vgetexppbf16 xmm2, xmm3 +# ATT: vgetexpbf16 %xmm3, %xmm2 +# INTEL: vgetexpbf16 xmm2, xmm3 0x62,0xf5,0x7d,0x08,0x42,0xd3 -# ATT: vgetexppbf16 %xmm3, %xmm2 {%k7} -# INTEL: vgetexppbf16 xmm2 {k7}, xmm3 +# ATT: vgetexpbf16 %xmm3, %xmm2 {%k7} +# INTEL: vgetexpbf16 xmm2 {k7}, xmm3 0x62,0xf5,0x7d,0x0f,0x42,0xd3 -# ATT: vgetexppbf16 %xmm3, %xmm2 {%k7} 
{z} -# INTEL: vgetexppbf16 xmm2 {k7} {z}, xmm3 +# ATT: vgetexpbf16 %xmm3, %xmm2 {%k7} {z} +# INTEL: vgetexpbf16 xmm2 {k7} {z}, xmm3 0x62,0xf5,0x7d,0x8f,0x42,0xd3 -# ATT: vgetexppbf16 %zmm3, %zmm2 -# INTEL: vgetexppbf16 zmm2, zmm3 +# ATT: vgetexpbf16 %zmm3, %zmm2 +# INTEL: vgetexpbf16 zmm2, zmm3 0x62,0xf5,0x7d,0x48,0x42,0xd3 -# ATT: vgetexppbf16 %zmm3, %zmm2 {%k7} -# INTEL: vgetexppbf16 zmm2 {k7}, zmm3 +# ATT: vgetexpbf16 %zmm3, %zmm2 {%k7} +# INTEL: vgetexpbf16 zmm2 {k7}, zmm3 0x62,0xf5,0x7d,0x4f,0x42,0xd3 -# ATT: vgetexppbf16 %zmm3, %zmm2 {%k7} {z} -# INTEL: vgetexppbf16 zmm2 {k7} {z}, zmm3 +# ATT: vgetexpbf16 %zmm3, %zmm2 {%k7} {z} +# INTEL: vgetexpbf16 zmm2 {k7} {z}, zmm3 0x62,0xf5,0x7d,0xcf,0x42,0xd3 -# ATT: vgetexppbf16 %ymm3, %ymm2 -# INTEL: vgetexppbf16 ymm2, ymm3 +# ATT: vgetexpbf16 %ymm3, %ymm2 +# INTEL: vgetexpbf16 ymm2, ymm3 0x62,0xf5,0x7d,0x28,0x42,0xd3 -# ATT: vgetexppbf16 %ymm3, %ymm2 {%k7} -# INTEL: vgetexppbf16 ymm2 {k7}, ymm3 +# ATT: vgetexpbf16 %ymm3, %ymm2 {%k7} +# INTEL: vgetexpbf16 ymm2 {k7}, ymm3 0x62,0xf5,0x7d,0x2f,0x42,0xd3 -# ATT: vgetexppbf16 %ymm3, %ymm2 {%k7} {z} -# INTEL: vgetexppbf16 ymm2 {k7} {z}, ymm3 +# ATT: vgetexpbf16 %ymm3, %ymm2 {%k7} {z} +# INTEL: vgetexpbf16 ymm2 {k7} {z}, ymm3 0x62,0xf5,0x7d,0xaf,0x42,0xd3 -# ATT: vgetexppbf16 268435456(%esp,%esi,8), %xmm2 -# INTEL: vgetexppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vgetexpbf16 268435456(%esp,%esi,8), %xmm2 +# INTEL: vgetexpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x7d,0x08,0x42,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vgetexppbf16 291(%edi,%eax,4), %xmm2 {%k7} -# INTEL: vgetexppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +# ATT: vgetexpbf16 291(%edi,%eax,4), %xmm2 {%k7} +# INTEL: vgetexpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x7d,0x0f,0x42,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vgetexppbf16 (%eax){1to8}, %xmm2 -# INTEL: vgetexppbf16 xmm2, word ptr [eax]{1to8} +# ATT: vgetexpbf16 (%eax){1to8}, %xmm2 +# INTEL: vgetexpbf16 
xmm2, word ptr [eax]{1to8} 0x62,0xf5,0x7d,0x18,0x42,0x10 -# ATT: vgetexppbf16 -512(,%ebp,2), %xmm2 -# INTEL: vgetexppbf16 xmm2, xmmword ptr [2*ebp - 512] +# ATT: vgetexpbf16 -512(,%ebp,2), %xmm2 +# INTEL: vgetexpbf16 xmm2, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x7d,0x08,0x42,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vgetexppbf16 2032(%ecx), %xmm2 {%k7} {z} -# INTEL: vgetexppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] +# ATT: vgetexpbf16 2032(%ecx), %xmm2 {%k7} {z} +# INTEL: vgetexpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] 0x62,0xf5,0x7d,0x8f,0x42,0x51,0x7f -# ATT: vgetexppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -# INTEL: vgetexppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +# ATT: vgetexpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +# INTEL: vgetexpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} 0x62,0xf5,0x7d,0x9f,0x42,0x52,0x80 -# ATT: vgetexppbf16 268435456(%esp,%esi,8), %ymm2 -# INTEL: vgetexppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vgetexpbf16 268435456(%esp,%esi,8), %ymm2 +# INTEL: vgetexpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x7d,0x28,0x42,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vgetexppbf16 291(%edi,%eax,4), %ymm2 {%k7} -# INTEL: vgetexppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] +# ATT: vgetexpbf16 291(%edi,%eax,4), %ymm2 {%k7} +# INTEL: vgetexpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x7d,0x2f,0x42,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vgetexppbf16 (%eax){1to16}, %ymm2 -# INTEL: vgetexppbf16 ymm2, word ptr [eax]{1to16} +# ATT: vgetexpbf16 (%eax){1to16}, %ymm2 +# INTEL: vgetexpbf16 ymm2, word ptr [eax]{1to16} 0x62,0xf5,0x7d,0x38,0x42,0x10 -# ATT: vgetexppbf16 -1024(,%ebp,2), %ymm2 -# INTEL: vgetexppbf16 ymm2, ymmword ptr [2*ebp - 1024] +# ATT: vgetexpbf16 -1024(,%ebp,2), %ymm2 +# INTEL: vgetexpbf16 ymm2, ymmword ptr [2*ebp - 1024] 0x62,0xf5,0x7d,0x28,0x42,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vgetexppbf16 4064(%ecx), %ymm2 {%k7} {z} -# INTEL: vgetexppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +# ATT: 
vgetexpbf16 4064(%ecx), %ymm2 {%k7} {z} +# INTEL: vgetexpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] 0x62,0xf5,0x7d,0xaf,0x42,0x51,0x7f -# ATT: vgetexppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -# INTEL: vgetexppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} +# ATT: vgetexpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +# INTEL: vgetexpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} 0x62,0xf5,0x7d,0xbf,0x42,0x52,0x80 -# ATT: vgetexppbf16 268435456(%esp,%esi,8), %zmm2 -# INTEL: vgetexppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vgetexpbf16 268435456(%esp,%esi,8), %zmm2 +# INTEL: vgetexpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x7d,0x48,0x42,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vgetexppbf16 291(%edi,%eax,4), %zmm2 {%k7} -# INTEL: vgetexppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +# ATT: vgetexpbf16 291(%edi,%eax,4), %zmm2 {%k7} +# INTEL: vgetexpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x7d,0x4f,0x42,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vgetexppbf16 (%eax){1to32}, %zmm2 -# INTEL: vgetexppbf16 zmm2, word ptr [eax]{1to32} +# ATT: vgetexpbf16 (%eax){1to32}, %zmm2 +# INTEL: vgetexpbf16 zmm2, word ptr [eax]{1to32} 0x62,0xf5,0x7d,0x58,0x42,0x10 -# ATT: vgetexppbf16 -2048(,%ebp,2), %zmm2 -# INTEL: vgetexppbf16 zmm2, zmmword ptr [2*ebp - 2048] +# ATT: vgetexpbf16 -2048(,%ebp,2), %zmm2 +# INTEL: vgetexpbf16 zmm2, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x7d,0x48,0x42,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vgetexppbf16 8128(%ecx), %zmm2 {%k7} {z} -# INTEL: vgetexppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +# ATT: vgetexpbf16 8128(%ecx), %zmm2 {%k7} {z} +# INTEL: vgetexpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] 0x62,0xf5,0x7d,0xcf,0x42,0x51,0x7f -# ATT: vgetexppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -# INTEL: vgetexppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +# ATT: vgetexpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +# INTEL: vgetexpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} 0x62,0xf5,0x7d,0xdf,0x42,0x52,0x80 -# ATT: 
vgetmantpbf16 $123, %zmm3, %zmm2 -# INTEL: vgetmantpbf16 zmm2, zmm3, 123 +# ATT: vgetmantbf16 $123, %zmm3, %zmm2 +# INTEL: vgetmantbf16 zmm2, zmm3, 123 0x62,0xf3,0x7f,0x48,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} -# INTEL: vgetmantpbf16 zmm2 {k7}, zmm3, 123 +# ATT: vgetmantbf16 $123, %zmm3, %zmm2 {%k7} +# INTEL: vgetmantbf16 zmm2 {k7}, zmm3, 123 0x62,0xf3,0x7f,0x4f,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} {z} -# INTEL: vgetmantpbf16 zmm2 {k7} {z}, zmm3, 123 +# ATT: vgetmantbf16 $123, %zmm3, %zmm2 {%k7} {z} +# INTEL: vgetmantbf16 zmm2 {k7} {z}, zmm3, 123 0x62,0xf3,0x7f,0xcf,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %ymm3, %ymm2 -# INTEL: vgetmantpbf16 ymm2, ymm3, 123 +# ATT: vgetmantbf16 $123, %ymm3, %ymm2 +# INTEL: vgetmantbf16 ymm2, ymm3, 123 0x62,0xf3,0x7f,0x28,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} -# INTEL: vgetmantpbf16 ymm2 {k7}, ymm3, 123 +# ATT: vgetmantbf16 $123, %ymm3, %ymm2 {%k7} +# INTEL: vgetmantbf16 ymm2 {k7}, ymm3, 123 0x62,0xf3,0x7f,0x2f,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} {z} -# INTEL: vgetmantpbf16 ymm2 {k7} {z}, ymm3, 123 +# ATT: vgetmantbf16 $123, %ymm3, %ymm2 {%k7} {z} +# INTEL: vgetmantbf16 ymm2 {k7} {z}, ymm3, 123 0x62,0xf3,0x7f,0xaf,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %xmm3, %xmm2 -# INTEL: vgetmantpbf16 xmm2, xmm3, 123 +# ATT: vgetmantbf16 $123, %xmm3, %xmm2 +# INTEL: vgetmantbf16 xmm2, xmm3, 123 0x62,0xf3,0x7f,0x08,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} -# INTEL: vgetmantpbf16 xmm2 {k7}, xmm3, 123 +# ATT: vgetmantbf16 $123, %xmm3, %xmm2 {%k7} +# INTEL: vgetmantbf16 xmm2 {k7}, xmm3, 123 0x62,0xf3,0x7f,0x0f,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} {z} -# INTEL: vgetmantpbf16 xmm2 {k7} {z}, xmm3, 123 +# ATT: vgetmantbf16 $123, %xmm3, %xmm2 {%k7} {z} +# INTEL: vgetmantbf16 xmm2 {k7} {z}, xmm3, 123 0x62,0xf3,0x7f,0x8f,0x26,0xd3,0x7b -# ATT: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %xmm2 -# INTEL: 
vgetmantpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vgetmantbf16 $123, 268435456(%esp,%esi,8), %xmm2 +# INTEL: vgetmantbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x08,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vgetmantpbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} -# INTEL: vgetmantpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +# ATT: vgetmantbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} +# INTEL: vgetmantbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x0f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, (%eax){1to8}, %xmm2 -# INTEL: vgetmantpbf16 xmm2, word ptr [eax]{1to8}, 123 +# ATT: vgetmantbf16 $123, (%eax){1to8}, %xmm2 +# INTEL: vgetmantbf16 xmm2, word ptr [eax]{1to8}, 123 0x62,0xf3,0x7f,0x18,0x26,0x10,0x7b -# ATT: vgetmantpbf16 $123, -512(,%ebp,2), %xmm2 -# INTEL: vgetmantpbf16 xmm2, xmmword ptr [2*ebp - 512], 123 +# ATT: vgetmantbf16 $123, -512(,%ebp,2), %xmm2 +# INTEL: vgetmantbf16 xmm2, xmmword ptr [2*ebp - 512], 123 0x62,0xf3,0x7f,0x08,0x26,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vgetmantpbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} -# INTEL: vgetmantpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 +# ATT: vgetmantbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} +# INTEL: vgetmantbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 0x62,0xf3,0x7f,0x8f,0x26,0x51,0x7f,0x7b -# ATT: vgetmantpbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} -# INTEL: vgetmantpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 +# ATT: vgetmantbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} +# INTEL: vgetmantbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 0x62,0xf3,0x7f,0x9f,0x26,0x52,0x80,0x7b -# ATT: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %ymm2 -# INTEL: vgetmantpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vgetmantbf16 $123, 268435456(%esp,%esi,8), %ymm2 +# INTEL: vgetmantbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 
0x62,0xf3,0x7f,0x28,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vgetmantpbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} -# INTEL: vgetmantpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 +# ATT: vgetmantbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} +# INTEL: vgetmantbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x2f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, (%eax){1to16}, %ymm2 -# INTEL: vgetmantpbf16 ymm2, word ptr [eax]{1to16}, 123 +# ATT: vgetmantbf16 $123, (%eax){1to16}, %ymm2 +# INTEL: vgetmantbf16 ymm2, word ptr [eax]{1to16}, 123 0x62,0xf3,0x7f,0x38,0x26,0x10,0x7b -# ATT: vgetmantpbf16 $123, -1024(,%ebp,2), %ymm2 -# INTEL: vgetmantpbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 +# ATT: vgetmantbf16 $123, -1024(,%ebp,2), %ymm2 +# INTEL: vgetmantbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 0x62,0xf3,0x7f,0x28,0x26,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vgetmantpbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} -# INTEL: vgetmantpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 +# ATT: vgetmantbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} +# INTEL: vgetmantbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 0x62,0xf3,0x7f,0xaf,0x26,0x51,0x7f,0x7b -# ATT: vgetmantpbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} -# INTEL: vgetmantpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 +# ATT: vgetmantbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} +# INTEL: vgetmantbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 0x62,0xf3,0x7f,0xbf,0x26,0x52,0x80,0x7b -# ATT: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %zmm2 -# INTEL: vgetmantpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vgetmantbf16 $123, 268435456(%esp,%esi,8), %zmm2 +# INTEL: vgetmantbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x48,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vgetmantpbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} -# INTEL: vgetmantpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 +# ATT: vgetmantbf16 $123, 291(%edi,%eax,4), 
%zmm2 {%k7} +# INTEL: vgetmantbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x4f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, (%eax){1to32}, %zmm2 -# INTEL: vgetmantpbf16 zmm2, word ptr [eax]{1to32}, 123 +# ATT: vgetmantbf16 $123, (%eax){1to32}, %zmm2 +# INTEL: vgetmantbf16 zmm2, word ptr [eax]{1to32}, 123 0x62,0xf3,0x7f,0x58,0x26,0x10,0x7b -# ATT: vgetmantpbf16 $123, -2048(,%ebp,2), %zmm2 -# INTEL: vgetmantpbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 +# ATT: vgetmantbf16 $123, -2048(,%ebp,2), %zmm2 +# INTEL: vgetmantbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 0x62,0xf3,0x7f,0x48,0x26,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vgetmantpbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} -# INTEL: vgetmantpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 +# ATT: vgetmantbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} +# INTEL: vgetmantbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 0x62,0xf3,0x7f,0xcf,0x26,0x51,0x7f,0x7b -# ATT: vgetmantpbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} -# INTEL: vgetmantpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 +# ATT: vgetmantbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} +# INTEL: vgetmantbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 0x62,0xf3,0x7f,0xdf,0x26,0x52,0x80,0x7b -# ATT: vmaxpbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vmaxpbf16 ymm2, ymm3, ymm4 +# ATT: vmaxbf16 %ymm4, %ymm3, %ymm2 +# INTEL: vmaxbf16 ymm2, ymm3, ymm4 0x62,0xf5,0x65,0x28,0x5f,0xd4 -# ATT: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vmaxpbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vmaxbf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf5,0x65,0x2f,0x5f,0xd4 -# ATT: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf5,0x65,0xaf,0x5f,0xd4 -# ATT: vmaxpbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vmaxpbf16 zmm2, zmm3, zmm4 +# ATT: vmaxbf16 %zmm4, %zmm3, %zmm2 +# INTEL: vmaxbf16 zmm2, 
zmm3, zmm4 0x62,0xf5,0x65,0x48,0x5f,0xd4 -# ATT: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vmaxpbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vmaxbf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf5,0x65,0x4f,0x5f,0xd4 -# ATT: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf5,0x65,0xcf,0x5f,0xd4 -# ATT: vmaxpbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vmaxpbf16 xmm2, xmm3, xmm4 +# ATT: vmaxbf16 %xmm4, %xmm3, %xmm2 +# INTEL: vmaxbf16 xmm2, xmm3, xmm4 0x62,0xf5,0x65,0x08,0x5f,0xd4 -# ATT: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vmaxpbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vmaxbf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf5,0x65,0x0f,0x5f,0xd4 -# ATT: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf5,0x65,0x8f,0x5f,0xd4 -# ATT: vmaxpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vmaxpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vmaxbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vmaxbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x48,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vmaxpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vmaxpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vmaxbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vmaxbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x4f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vmaxpbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vmaxpbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vmaxbf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vmaxbf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf5,0x65,0x58,0x5f,0x10 -# ATT: vmaxpbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vmaxpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: 
vmaxbf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vmaxbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x65,0x48,0x5f,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vmaxpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vmaxbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf5,0x65,0xcf,0x5f,0x51,0x7f -# ATT: vmaxpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vmaxpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vmaxbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf5,0x65,0xdf,0x5f,0x52,0x80 -# ATT: vmaxpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vmaxpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vmaxbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vmaxbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x28,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vmaxpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vmaxpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vmaxbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vmaxbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x2f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vmaxpbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vmaxpbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vmaxbf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vmaxbf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf5,0x65,0x38,0x5f,0x10 -# ATT: vmaxpbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vmaxpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vmaxbf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vmaxbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf5,0x65,0x28,0x5f,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vmaxpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vmaxbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vmaxbf16 
ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf5,0x65,0xaf,0x5f,0x51,0x7f -# ATT: vmaxpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vmaxpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vmaxbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf5,0x65,0xbf,0x5f,0x52,0x80 -# ATT: vmaxpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vmaxpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vmaxbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vmaxbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x08,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vmaxpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vmaxpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vmaxbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vmaxbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x0f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vmaxpbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vmaxpbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vmaxbf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vmaxbf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf5,0x65,0x18,0x5f,0x10 -# ATT: vmaxpbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vmaxpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vmaxbf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vmaxbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x65,0x08,0x5f,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vmaxpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vmaxbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf5,0x65,0x8f,0x5f,0x51,0x7f -# ATT: vmaxpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vmaxpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vmaxbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 
0x62,0xf5,0x65,0x9f,0x5f,0x52,0x80 -# ATT: vminpbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vminpbf16 ymm2, ymm3, ymm4 +# ATT: vminbf16 %ymm4, %ymm3, %ymm2 +# INTEL: vminbf16 ymm2, ymm3, ymm4 0x62,0xf5,0x65,0x28,0x5d,0xd4 -# ATT: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vminpbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vminbf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vminbf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf5,0x65,0x2f,0x5d,0xd4 -# ATT: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vminpbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vminbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf5,0x65,0xaf,0x5d,0xd4 -# ATT: vminpbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vminpbf16 zmm2, zmm3, zmm4 +# ATT: vminbf16 %zmm4, %zmm3, %zmm2 +# INTEL: vminbf16 zmm2, zmm3, zmm4 0x62,0xf5,0x65,0x48,0x5d,0xd4 -# ATT: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vminpbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vminbf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vminbf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf5,0x65,0x4f,0x5d,0xd4 -# ATT: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vminpbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vminbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf5,0x65,0xcf,0x5d,0xd4 -# ATT: vminpbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vminpbf16 xmm2, xmm3, xmm4 +# ATT: vminbf16 %xmm4, %xmm3, %xmm2 +# INTEL: vminbf16 xmm2, xmm3, xmm4 0x62,0xf5,0x65,0x08,0x5d,0xd4 -# ATT: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vminpbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vminbf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vminbf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf5,0x65,0x0f,0x5d,0xd4 -# ATT: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vminpbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vminbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf5,0x65,0x8f,0x5d,0xd4 -# ATT: vminpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vminpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vminbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# 
INTEL: vminbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x48,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vminpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vminpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vminbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vminbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x4f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vminpbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vminpbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vminbf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vminbf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf5,0x65,0x58,0x5d,0x10 -# ATT: vminpbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vminpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vminbf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vminbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x65,0x48,0x5d,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vminpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vminpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vminbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf5,0x65,0xcf,0x5d,0x51,0x7f -# ATT: vminpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vminpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vminbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf5,0x65,0xdf,0x5d,0x52,0x80 -# ATT: vminpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vminpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vminbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vminbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x28,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vminpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vminpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vminbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vminbf16 ymm2 {k7}, ymm3, 
ymmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x2f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vminpbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vminpbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vminbf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vminbf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf5,0x65,0x38,0x5d,0x10 -# ATT: vminpbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vminpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vminbf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vminbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf5,0x65,0x28,0x5d,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vminpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vminpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vminbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf5,0x65,0xaf,0x5d,0x51,0x7f -# ATT: vminpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vminpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vminbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf5,0x65,0xbf,0x5d,0x52,0x80 -# ATT: vminpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vminpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vminbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vminbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x08,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vminpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vminpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vminbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vminbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x0f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vminpbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vminpbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vminbf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vminbf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf5,0x65,0x18,0x5d,0x10 -# ATT: vminpbf16 
-512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vminpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vminbf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vminbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x65,0x08,0x5d,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vminpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vminpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vminbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf5,0x65,0x8f,0x5d,0x51,0x7f -# ATT: vminpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vminpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vminbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf5,0x65,0x9f,0x5d,0x52,0x80 -# ATT: vmulnepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vmulnepbf16 ymm2, ymm3, ymm4 +# ATT: vmulbf16 %ymm4, %ymm3, %ymm2 +# INTEL: vmulbf16 ymm2, ymm3, ymm4 0x62,0xf5,0x65,0x28,0x59,0xd4 -# ATT: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vmulnepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vmulbf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf5,0x65,0x2f,0x59,0xd4 -# ATT: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf5,0x65,0xaf,0x59,0xd4 -# ATT: vmulnepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vmulnepbf16 zmm2, zmm3, zmm4 +# ATT: vmulbf16 %zmm4, %zmm3, %zmm2 +# INTEL: vmulbf16 zmm2, zmm3, zmm4 0x62,0xf5,0x65,0x48,0x59,0xd4 -# ATT: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vmulnepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vmulbf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf5,0x65,0x4f,0x59,0xd4 -# ATT: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, zmm4 
0x62,0xf5,0x65,0xcf,0x59,0xd4 -# ATT: vmulnepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vmulnepbf16 xmm2, xmm3, xmm4 +# ATT: vmulbf16 %xmm4, %xmm3, %xmm2 +# INTEL: vmulbf16 xmm2, xmm3, xmm4 0x62,0xf5,0x65,0x08,0x59,0xd4 -# ATT: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vmulnepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vmulbf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf5,0x65,0x0f,0x59,0xd4 -# ATT: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf5,0x65,0x8f,0x59,0xd4 -# ATT: vmulnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vmulnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vmulbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vmulbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x48,0x59,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vmulnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vmulnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vmulbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vmulbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x4f,0x59,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vmulnepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vmulnepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vmulbf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vmulbf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf5,0x65,0x58,0x59,0x10 -# ATT: vmulnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vmulnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vmulbf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vmulbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x65,0x48,0x59,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vmulnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vmulbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 
0x62,0xf5,0x65,0xcf,0x59,0x51,0x7f -# ATT: vmulnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vmulnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vmulbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf5,0x65,0xdf,0x59,0x52,0x80 -# ATT: vmulnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vmulnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vmulbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vmulbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x28,0x59,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vmulnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vmulnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vmulbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vmulbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x2f,0x59,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vmulnepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vmulnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vmulbf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vmulbf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf5,0x65,0x38,0x59,0x10 -# ATT: vmulnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vmulnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vmulbf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vmulbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf5,0x65,0x28,0x59,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vmulnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vmulbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf5,0x65,0xaf,0x59,0x51,0x7f -# ATT: vmulnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vmulnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vmulbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 
0x62,0xf5,0x65,0xbf,0x59,0x52,0x80 -# ATT: vmulnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vmulnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vmulbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vmulbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x08,0x59,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vmulnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vmulnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vmulbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vmulbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x0f,0x59,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vmulnepbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vmulnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vmulbf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vmulbf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf5,0x65,0x18,0x59,0x10 -# ATT: vmulnepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vmulnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vmulbf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vmulbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x65,0x08,0x59,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vmulnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vmulbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf5,0x65,0x8f,0x59,0x51,0x7f -# ATT: vmulnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vmulnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vmulbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf5,0x65,0x9f,0x59,0x52,0x80 -# ATT: vrcppbf16 %xmm3, %xmm2 -# INTEL: vrcppbf16 xmm2, xmm3 +# ATT: vrcpbf16 %xmm3, %xmm2 +# INTEL: vrcpbf16 xmm2, xmm3 0x62,0xf6,0x7c,0x08,0x4c,0xd3 -# ATT: vrcppbf16 %xmm3, %xmm2 {%k7} -# INTEL: vrcppbf16 xmm2 {k7}, xmm3 +# ATT: vrcpbf16 %xmm3, %xmm2 {%k7} +# INTEL: vrcpbf16 xmm2 {k7}, 
xmm3 0x62,0xf6,0x7c,0x0f,0x4c,0xd3 -# ATT: vrcppbf16 %xmm3, %xmm2 {%k7} {z} -# INTEL: vrcppbf16 xmm2 {k7} {z}, xmm3 +# ATT: vrcpbf16 %xmm3, %xmm2 {%k7} {z} +# INTEL: vrcpbf16 xmm2 {k7} {z}, xmm3 0x62,0xf6,0x7c,0x8f,0x4c,0xd3 -# ATT: vrcppbf16 %zmm3, %zmm2 -# INTEL: vrcppbf16 zmm2, zmm3 +# ATT: vrcpbf16 %zmm3, %zmm2 +# INTEL: vrcpbf16 zmm2, zmm3 0x62,0xf6,0x7c,0x48,0x4c,0xd3 -# ATT: vrcppbf16 %zmm3, %zmm2 {%k7} -# INTEL: vrcppbf16 zmm2 {k7}, zmm3 +# ATT: vrcpbf16 %zmm3, %zmm2 {%k7} +# INTEL: vrcpbf16 zmm2 {k7}, zmm3 0x62,0xf6,0x7c,0x4f,0x4c,0xd3 -# ATT: vrcppbf16 %zmm3, %zmm2 {%k7} {z} -# INTEL: vrcppbf16 zmm2 {k7} {z}, zmm3 +# ATT: vrcpbf16 %zmm3, %zmm2 {%k7} {z} +# INTEL: vrcpbf16 zmm2 {k7} {z}, zmm3 0x62,0xf6,0x7c,0xcf,0x4c,0xd3 -# ATT: vrcppbf16 %ymm3, %ymm2 -# INTEL: vrcppbf16 ymm2, ymm3 +# ATT: vrcpbf16 %ymm3, %ymm2 +# INTEL: vrcpbf16 ymm2, ymm3 0x62,0xf6,0x7c,0x28,0x4c,0xd3 -# ATT: vrcppbf16 %ymm3, %ymm2 {%k7} -# INTEL: vrcppbf16 ymm2 {k7}, ymm3 +# ATT: vrcpbf16 %ymm3, %ymm2 {%k7} +# INTEL: vrcpbf16 ymm2 {k7}, ymm3 0x62,0xf6,0x7c,0x2f,0x4c,0xd3 -# ATT: vrcppbf16 %ymm3, %ymm2 {%k7} {z} -# INTEL: vrcppbf16 ymm2 {k7} {z}, ymm3 +# ATT: vrcpbf16 %ymm3, %ymm2 {%k7} {z} +# INTEL: vrcpbf16 ymm2 {k7} {z}, ymm3 0x62,0xf6,0x7c,0xaf,0x4c,0xd3 -# ATT: vrcppbf16 268435456(%esp,%esi,8), %xmm2 -# INTEL: vrcppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vrcpbf16 268435456(%esp,%esi,8), %xmm2 +# INTEL: vrcpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x7c,0x08,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vrcppbf16 291(%edi,%eax,4), %xmm2 {%k7} -# INTEL: vrcppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +# ATT: vrcpbf16 291(%edi,%eax,4), %xmm2 {%k7} +# INTEL: vrcpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x7c,0x0f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vrcppbf16 (%eax){1to8}, %xmm2 -# INTEL: vrcppbf16 xmm2, word ptr [eax]{1to8} +# ATT: vrcpbf16 (%eax){1to8}, %xmm2 +# INTEL: vrcpbf16 xmm2, word ptr [eax]{1to8} 
0x62,0xf6,0x7c,0x18,0x4c,0x10 -# ATT: vrcppbf16 -512(,%ebp,2), %xmm2 -# INTEL: vrcppbf16 xmm2, xmmword ptr [2*ebp - 512] +# ATT: vrcpbf16 -512(,%ebp,2), %xmm2 +# INTEL: vrcpbf16 xmm2, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x7c,0x08,0x4c,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vrcppbf16 2032(%ecx), %xmm2 {%k7} {z} -# INTEL: vrcppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] +# ATT: vrcpbf16 2032(%ecx), %xmm2 {%k7} {z} +# INTEL: vrcpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] 0x62,0xf6,0x7c,0x8f,0x4c,0x51,0x7f -# ATT: vrcppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -# INTEL: vrcppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +# ATT: vrcpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +# INTEL: vrcpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} 0x62,0xf6,0x7c,0x9f,0x4c,0x52,0x80 -# ATT: vrcppbf16 268435456(%esp,%esi,8), %ymm2 -# INTEL: vrcppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vrcpbf16 268435456(%esp,%esi,8), %ymm2 +# INTEL: vrcpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x7c,0x28,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vrcppbf16 291(%edi,%eax,4), %ymm2 {%k7} -# INTEL: vrcppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] +# ATT: vrcpbf16 291(%edi,%eax,4), %ymm2 {%k7} +# INTEL: vrcpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x7c,0x2f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vrcppbf16 (%eax){1to16}, %ymm2 -# INTEL: vrcppbf16 ymm2, word ptr [eax]{1to16} +# ATT: vrcpbf16 (%eax){1to16}, %ymm2 +# INTEL: vrcpbf16 ymm2, word ptr [eax]{1to16} 0x62,0xf6,0x7c,0x38,0x4c,0x10 -# ATT: vrcppbf16 -1024(,%ebp,2), %ymm2 -# INTEL: vrcppbf16 ymm2, ymmword ptr [2*ebp - 1024] +# ATT: vrcpbf16 -1024(,%ebp,2), %ymm2 +# INTEL: vrcpbf16 ymm2, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x7c,0x28,0x4c,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vrcppbf16 4064(%ecx), %ymm2 {%k7} {z} -# INTEL: vrcppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +# ATT: vrcpbf16 4064(%ecx), %ymm2 {%k7} {z} +# INTEL: vrcpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] 
0x62,0xf6,0x7c,0xaf,0x4c,0x51,0x7f -# ATT: vrcppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -# INTEL: vrcppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} +# ATT: vrcpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +# INTEL: vrcpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} 0x62,0xf6,0x7c,0xbf,0x4c,0x52,0x80 -# ATT: vrcppbf16 268435456(%esp,%esi,8), %zmm2 -# INTEL: vrcppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vrcpbf16 268435456(%esp,%esi,8), %zmm2 +# INTEL: vrcpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x7c,0x48,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vrcppbf16 291(%edi,%eax,4), %zmm2 {%k7} -# INTEL: vrcppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +# ATT: vrcpbf16 291(%edi,%eax,4), %zmm2 {%k7} +# INTEL: vrcpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x7c,0x4f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vrcppbf16 (%eax){1to32}, %zmm2 -# INTEL: vrcppbf16 zmm2, word ptr [eax]{1to32} +# ATT: vrcpbf16 (%eax){1to32}, %zmm2 +# INTEL: vrcpbf16 zmm2, word ptr [eax]{1to32} 0x62,0xf6,0x7c,0x58,0x4c,0x10 -# ATT: vrcppbf16 -2048(,%ebp,2), %zmm2 -# INTEL: vrcppbf16 zmm2, zmmword ptr [2*ebp - 2048] +# ATT: vrcpbf16 -2048(,%ebp,2), %zmm2 +# INTEL: vrcpbf16 zmm2, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x7c,0x48,0x4c,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vrcppbf16 8128(%ecx), %zmm2 {%k7} {z} -# INTEL: vrcppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +# ATT: vrcpbf16 8128(%ecx), %zmm2 {%k7} {z} +# INTEL: vrcpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] 0x62,0xf6,0x7c,0xcf,0x4c,0x51,0x7f -# ATT: vrcppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -# INTEL: vrcppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +# ATT: vrcpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +# INTEL: vrcpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} 0x62,0xf6,0x7c,0xdf,0x4c,0x52,0x80 -# ATT: vreducenepbf16 $123, %zmm3, %zmm2 -# INTEL: vreducenepbf16 zmm2, zmm3, 123 +# ATT: vreducebf16 $123, %zmm3, %zmm2 +# INTEL: vreducebf16 zmm2, zmm3, 123 0x62,0xf3,0x7f,0x48,0x56,0xd3,0x7b 
-# ATT: vreducenepbf16 $123, %zmm3, %zmm2 {%k7} -# INTEL: vreducenepbf16 zmm2 {k7}, zmm3, 123 +# ATT: vreducebf16 $123, %zmm3, %zmm2 {%k7} +# INTEL: vreducebf16 zmm2 {k7}, zmm3, 123 0x62,0xf3,0x7f,0x4f,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, %zmm3, %zmm2 {%k7} {z} -# INTEL: vreducenepbf16 zmm2 {k7} {z}, zmm3, 123 +# ATT: vreducebf16 $123, %zmm3, %zmm2 {%k7} {z} +# INTEL: vreducebf16 zmm2 {k7} {z}, zmm3, 123 0x62,0xf3,0x7f,0xcf,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, %ymm3, %ymm2 -# INTEL: vreducenepbf16 ymm2, ymm3, 123 +# ATT: vreducebf16 $123, %ymm3, %ymm2 +# INTEL: vreducebf16 ymm2, ymm3, 123 0x62,0xf3,0x7f,0x28,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, %ymm3, %ymm2 {%k7} -# INTEL: vreducenepbf16 ymm2 {k7}, ymm3, 123 +# ATT: vreducebf16 $123, %ymm3, %ymm2 {%k7} +# INTEL: vreducebf16 ymm2 {k7}, ymm3, 123 0x62,0xf3,0x7f,0x2f,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, %ymm3, %ymm2 {%k7} {z} -# INTEL: vreducenepbf16 ymm2 {k7} {z}, ymm3, 123 +# ATT: vreducebf16 $123, %ymm3, %ymm2 {%k7} {z} +# INTEL: vreducebf16 ymm2 {k7} {z}, ymm3, 123 0x62,0xf3,0x7f,0xaf,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, %xmm3, %xmm2 -# INTEL: vreducenepbf16 xmm2, xmm3, 123 +# ATT: vreducebf16 $123, %xmm3, %xmm2 +# INTEL: vreducebf16 xmm2, xmm3, 123 0x62,0xf3,0x7f,0x08,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, %xmm3, %xmm2 {%k7} -# INTEL: vreducenepbf16 xmm2 {k7}, xmm3, 123 +# ATT: vreducebf16 $123, %xmm3, %xmm2 {%k7} +# INTEL: vreducebf16 xmm2 {k7}, xmm3, 123 0x62,0xf3,0x7f,0x0f,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, %xmm3, %xmm2 {%k7} {z} -# INTEL: vreducenepbf16 xmm2 {k7} {z}, xmm3, 123 +# ATT: vreducebf16 $123, %xmm3, %xmm2 {%k7} {z} +# INTEL: vreducebf16 xmm2 {k7} {z}, xmm3, 123 0x62,0xf3,0x7f,0x8f,0x56,0xd3,0x7b -# ATT: vreducenepbf16 $123, 268435456(%esp,%esi,8), %xmm2 -# INTEL: vreducenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vreducebf16 $123, 268435456(%esp,%esi,8), %xmm2 +# INTEL: vreducebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 
0x62,0xf3,0x7f,0x08,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vreducenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} -# INTEL: vreducenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +# ATT: vreducebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} +# INTEL: vreducebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x0f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, (%eax){1to8}, %xmm2 -# INTEL: vreducenepbf16 xmm2, word ptr [eax]{1to8}, 123 +# ATT: vreducebf16 $123, (%eax){1to8}, %xmm2 +# INTEL: vreducebf16 xmm2, word ptr [eax]{1to8}, 123 0x62,0xf3,0x7f,0x18,0x56,0x10,0x7b -# ATT: vreducenepbf16 $123, -512(,%ebp,2), %xmm2 -# INTEL: vreducenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123 +# ATT: vreducebf16 $123, -512(,%ebp,2), %xmm2 +# INTEL: vreducebf16 xmm2, xmmword ptr [2*ebp - 512], 123 0x62,0xf3,0x7f,0x08,0x56,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vreducenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} -# INTEL: vreducenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 +# ATT: vreducebf16 $123, 2032(%ecx), %xmm2 {%k7} {z} +# INTEL: vreducebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 0x62,0xf3,0x7f,0x8f,0x56,0x51,0x7f,0x7b -# ATT: vreducenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} -# INTEL: vreducenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 +# ATT: vreducebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} +# INTEL: vreducebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 0x62,0xf3,0x7f,0x9f,0x56,0x52,0x80,0x7b -# ATT: vreducenepbf16 $123, 268435456(%esp,%esi,8), %ymm2 -# INTEL: vreducenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vreducebf16 $123, 268435456(%esp,%esi,8), %ymm2 +# INTEL: vreducebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x28,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vreducenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} -# INTEL: vreducenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 +# ATT: vreducebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} +# 
INTEL: vreducebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x2f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, (%eax){1to16}, %ymm2 -# INTEL: vreducenepbf16 ymm2, word ptr [eax]{1to16}, 123 +# ATT: vreducebf16 $123, (%eax){1to16}, %ymm2 +# INTEL: vreducebf16 ymm2, word ptr [eax]{1to16}, 123 0x62,0xf3,0x7f,0x38,0x56,0x10,0x7b -# ATT: vreducenepbf16 $123, -1024(,%ebp,2), %ymm2 -# INTEL: vreducenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 +# ATT: vreducebf16 $123, -1024(,%ebp,2), %ymm2 +# INTEL: vreducebf16 ymm2, ymmword ptr [2*ebp - 1024], 123 0x62,0xf3,0x7f,0x28,0x56,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vreducenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} -# INTEL: vreducenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 +# ATT: vreducebf16 $123, 4064(%ecx), %ymm2 {%k7} {z} +# INTEL: vreducebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 0x62,0xf3,0x7f,0xaf,0x56,0x51,0x7f,0x7b -# ATT: vreducenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} -# INTEL: vreducenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 +# ATT: vreducebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} +# INTEL: vreducebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 0x62,0xf3,0x7f,0xbf,0x56,0x52,0x80,0x7b -# ATT: vreducenepbf16 $123, 268435456(%esp,%esi,8), %zmm2 -# INTEL: vreducenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vreducebf16 $123, 268435456(%esp,%esi,8), %zmm2 +# INTEL: vreducebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x48,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vreducenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} -# INTEL: vreducenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 +# ATT: vreducebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} +# INTEL: vreducebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x4f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, (%eax){1to32}, %zmm2 -# INTEL: vreducenepbf16 zmm2, word ptr [eax]{1to32}, 123 +# 
ATT: vreducebf16 $123, (%eax){1to32}, %zmm2 +# INTEL: vreducebf16 zmm2, word ptr [eax]{1to32}, 123 0x62,0xf3,0x7f,0x58,0x56,0x10,0x7b -# ATT: vreducenepbf16 $123, -2048(,%ebp,2), %zmm2 -# INTEL: vreducenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 +# ATT: vreducebf16 $123, -2048(,%ebp,2), %zmm2 +# INTEL: vreducebf16 zmm2, zmmword ptr [2*ebp - 2048], 123 0x62,0xf3,0x7f,0x48,0x56,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vreducenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} -# INTEL: vreducenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 +# ATT: vreducebf16 $123, 8128(%ecx), %zmm2 {%k7} {z} +# INTEL: vreducebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 0x62,0xf3,0x7f,0xcf,0x56,0x51,0x7f,0x7b -# ATT: vreducenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} -# INTEL: vreducenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 +# ATT: vreducebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} +# INTEL: vreducebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 0x62,0xf3,0x7f,0xdf,0x56,0x52,0x80,0x7b -# ATT: vrndscalenepbf16 $123, %zmm3, %zmm2 -# INTEL: vrndscalenepbf16 zmm2, zmm3, 123 +# ATT: vrndscalebf16 $123, %zmm3, %zmm2 +# INTEL: vrndscalebf16 zmm2, zmm3, 123 0x62,0xf3,0x7f,0x48,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} -# INTEL: vrndscalenepbf16 zmm2 {k7}, zmm3, 123 +# ATT: vrndscalebf16 $123, %zmm3, %zmm2 {%k7} +# INTEL: vrndscalebf16 zmm2 {k7}, zmm3, 123 0x62,0xf3,0x7f,0x4f,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} {z} -# INTEL: vrndscalenepbf16 zmm2 {k7} {z}, zmm3, 123 +# ATT: vrndscalebf16 $123, %zmm3, %zmm2 {%k7} {z} +# INTEL: vrndscalebf16 zmm2 {k7} {z}, zmm3, 123 0x62,0xf3,0x7f,0xcf,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %ymm3, %ymm2 -# INTEL: vrndscalenepbf16 ymm2, ymm3, 123 +# ATT: vrndscalebf16 $123, %ymm3, %ymm2 +# INTEL: vrndscalebf16 ymm2, ymm3, 123 0x62,0xf3,0x7f,0x28,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} -# INTEL: vrndscalenepbf16 ymm2 {k7}, ymm3, 123 +# ATT: 
vrndscalebf16 $123, %ymm3, %ymm2 {%k7} +# INTEL: vrndscalebf16 ymm2 {k7}, ymm3, 123 0x62,0xf3,0x7f,0x2f,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} {z} -# INTEL: vrndscalenepbf16 ymm2 {k7} {z}, ymm3, 123 +# ATT: vrndscalebf16 $123, %ymm3, %ymm2 {%k7} {z} +# INTEL: vrndscalebf16 ymm2 {k7} {z}, ymm3, 123 0x62,0xf3,0x7f,0xaf,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %xmm3, %xmm2 -# INTEL: vrndscalenepbf16 xmm2, xmm3, 123 +# ATT: vrndscalebf16 $123, %xmm3, %xmm2 +# INTEL: vrndscalebf16 xmm2, xmm3, 123 0x62,0xf3,0x7f,0x08,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} -# INTEL: vrndscalenepbf16 xmm2 {k7}, xmm3, 123 +# ATT: vrndscalebf16 $123, %xmm3, %xmm2 {%k7} +# INTEL: vrndscalebf16 xmm2 {k7}, xmm3, 123 0x62,0xf3,0x7f,0x0f,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} {z} -# INTEL: vrndscalenepbf16 xmm2 {k7} {z}, xmm3, 123 +# ATT: vrndscalebf16 $123, %xmm3, %xmm2 {%k7} {z} +# INTEL: vrndscalebf16 xmm2 {k7} {z}, xmm3, 123 0x62,0xf3,0x7f,0x8f,0x08,0xd3,0x7b -# ATT: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %xmm2 -# INTEL: vrndscalenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vrndscalebf16 $123, 268435456(%esp,%esi,8), %xmm2 +# INTEL: vrndscalebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x08,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vrndscalenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} -# INTEL: vrndscalenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +# ATT: vrndscalebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} +# INTEL: vrndscalebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x0f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, (%eax){1to8}, %xmm2 -# INTEL: vrndscalenepbf16 xmm2, word ptr [eax]{1to8}, 123 +# ATT: vrndscalebf16 $123, (%eax){1to8}, %xmm2 +# INTEL: vrndscalebf16 xmm2, word ptr [eax]{1to8}, 123 0x62,0xf3,0x7f,0x18,0x08,0x10,0x7b -# ATT: vrndscalenepbf16 $123, -512(,%ebp,2), %xmm2 -# INTEL: 
vrndscalenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123 +# ATT: vrndscalebf16 $123, -512(,%ebp,2), %xmm2 +# INTEL: vrndscalebf16 xmm2, xmmword ptr [2*ebp - 512], 123 0x62,0xf3,0x7f,0x08,0x08,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vrndscalenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} -# INTEL: vrndscalenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 +# ATT: vrndscalebf16 $123, 2032(%ecx), %xmm2 {%k7} {z} +# INTEL: vrndscalebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 0x62,0xf3,0x7f,0x8f,0x08,0x51,0x7f,0x7b -# ATT: vrndscalenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} -# INTEL: vrndscalenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 +# ATT: vrndscalebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} +# INTEL: vrndscalebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 0x62,0xf3,0x7f,0x9f,0x08,0x52,0x80,0x7b -# ATT: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %ymm2 -# INTEL: vrndscalenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vrndscalebf16 $123, 268435456(%esp,%esi,8), %ymm2 +# INTEL: vrndscalebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x28,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vrndscalenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} -# INTEL: vrndscalenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 +# ATT: vrndscalebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} +# INTEL: vrndscalebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x2f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, (%eax){1to16}, %ymm2 -# INTEL: vrndscalenepbf16 ymm2, word ptr [eax]{1to16}, 123 +# ATT: vrndscalebf16 $123, (%eax){1to16}, %ymm2 +# INTEL: vrndscalebf16 ymm2, word ptr [eax]{1to16}, 123 0x62,0xf3,0x7f,0x38,0x08,0x10,0x7b -# ATT: vrndscalenepbf16 $123, -1024(,%ebp,2), %ymm2 -# INTEL: vrndscalenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 +# ATT: vrndscalebf16 $123, -1024(,%ebp,2), %ymm2 +# INTEL: vrndscalebf16 ymm2, ymmword ptr [2*ebp - 1024], 123 
0x62,0xf3,0x7f,0x28,0x08,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vrndscalenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} -# INTEL: vrndscalenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 +# ATT: vrndscalebf16 $123, 4064(%ecx), %ymm2 {%k7} {z} +# INTEL: vrndscalebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 0x62,0xf3,0x7f,0xaf,0x08,0x51,0x7f,0x7b -# ATT: vrndscalenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} -# INTEL: vrndscalenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 +# ATT: vrndscalebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} +# INTEL: vrndscalebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 0x62,0xf3,0x7f,0xbf,0x08,0x52,0x80,0x7b -# ATT: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %zmm2 -# INTEL: vrndscalenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 +# ATT: vrndscalebf16 $123, 268435456(%esp,%esi,8), %zmm2 +# INTEL: vrndscalebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 0x62,0xf3,0x7f,0x48,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b -# ATT: vrndscalenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} -# INTEL: vrndscalenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 +# ATT: vrndscalebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} +# INTEL: vrndscalebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 0x62,0xf3,0x7f,0x4f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, (%eax){1to32}, %zmm2 -# INTEL: vrndscalenepbf16 zmm2, word ptr [eax]{1to32}, 123 +# ATT: vrndscalebf16 $123, (%eax){1to32}, %zmm2 +# INTEL: vrndscalebf16 zmm2, word ptr [eax]{1to32}, 123 0x62,0xf3,0x7f,0x58,0x08,0x10,0x7b -# ATT: vrndscalenepbf16 $123, -2048(,%ebp,2), %zmm2 -# INTEL: vrndscalenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 +# ATT: vrndscalebf16 $123, -2048(,%ebp,2), %zmm2 +# INTEL: vrndscalebf16 zmm2, zmmword ptr [2*ebp - 2048], 123 0x62,0xf3,0x7f,0x48,0x08,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vrndscalenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} -# INTEL: vrndscalenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 
+# ATT: vrndscalebf16 $123, 8128(%ecx), %zmm2 {%k7} {z} +# INTEL: vrndscalebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 0x62,0xf3,0x7f,0xcf,0x08,0x51,0x7f,0x7b -# ATT: vrndscalenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} -# INTEL: vrndscalenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 +# ATT: vrndscalebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} +# INTEL: vrndscalebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 0x62,0xf3,0x7f,0xdf,0x08,0x52,0x80,0x7b -# ATT: vrsqrtpbf16 %xmm3, %xmm2 -# INTEL: vrsqrtpbf16 xmm2, xmm3 +# ATT: vrsqrtbf16 %xmm3, %xmm2 +# INTEL: vrsqrtbf16 xmm2, xmm3 0x62,0xf6,0x7c,0x08,0x4e,0xd3 -# ATT: vrsqrtpbf16 %xmm3, %xmm2 {%k7} -# INTEL: vrsqrtpbf16 xmm2 {k7}, xmm3 +# ATT: vrsqrtbf16 %xmm3, %xmm2 {%k7} +# INTEL: vrsqrtbf16 xmm2 {k7}, xmm3 0x62,0xf6,0x7c,0x0f,0x4e,0xd3 -# ATT: vrsqrtpbf16 %xmm3, %xmm2 {%k7} {z} -# INTEL: vrsqrtpbf16 xmm2 {k7} {z}, xmm3 +# ATT: vrsqrtbf16 %xmm3, %xmm2 {%k7} {z} +# INTEL: vrsqrtbf16 xmm2 {k7} {z}, xmm3 0x62,0xf6,0x7c,0x8f,0x4e,0xd3 -# ATT: vrsqrtpbf16 %zmm3, %zmm2 -# INTEL: vrsqrtpbf16 zmm2, zmm3 +# ATT: vrsqrtbf16 %zmm3, %zmm2 +# INTEL: vrsqrtbf16 zmm2, zmm3 0x62,0xf6,0x7c,0x48,0x4e,0xd3 -# ATT: vrsqrtpbf16 %zmm3, %zmm2 {%k7} -# INTEL: vrsqrtpbf16 zmm2 {k7}, zmm3 +# ATT: vrsqrtbf16 %zmm3, %zmm2 {%k7} +# INTEL: vrsqrtbf16 zmm2 {k7}, zmm3 0x62,0xf6,0x7c,0x4f,0x4e,0xd3 -# ATT: vrsqrtpbf16 %zmm3, %zmm2 {%k7} {z} -# INTEL: vrsqrtpbf16 zmm2 {k7} {z}, zmm3 +# ATT: vrsqrtbf16 %zmm3, %zmm2 {%k7} {z} +# INTEL: vrsqrtbf16 zmm2 {k7} {z}, zmm3 0x62,0xf6,0x7c,0xcf,0x4e,0xd3 -# ATT: vrsqrtpbf16 %ymm3, %ymm2 -# INTEL: vrsqrtpbf16 ymm2, ymm3 +# ATT: vrsqrtbf16 %ymm3, %ymm2 +# INTEL: vrsqrtbf16 ymm2, ymm3 0x62,0xf6,0x7c,0x28,0x4e,0xd3 -# ATT: vrsqrtpbf16 %ymm3, %ymm2 {%k7} -# INTEL: vrsqrtpbf16 ymm2 {k7}, ymm3 +# ATT: vrsqrtbf16 %ymm3, %ymm2 {%k7} +# INTEL: vrsqrtbf16 ymm2 {k7}, ymm3 0x62,0xf6,0x7c,0x2f,0x4e,0xd3 -# ATT: vrsqrtpbf16 %ymm3, %ymm2 {%k7} {z} -# INTEL: vrsqrtpbf16 ymm2 {k7} {z}, ymm3 +# ATT: 
vrsqrtbf16 %ymm3, %ymm2 {%k7} {z} +# INTEL: vrsqrtbf16 ymm2 {k7} {z}, ymm3 0x62,0xf6,0x7c,0xaf,0x4e,0xd3 -# ATT: vrsqrtpbf16 268435456(%esp,%esi,8), %xmm2 -# INTEL: vrsqrtpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vrsqrtbf16 268435456(%esp,%esi,8), %xmm2 +# INTEL: vrsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x7c,0x08,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vrsqrtpbf16 291(%edi,%eax,4), %xmm2 {%k7} -# INTEL: vrsqrtpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +# ATT: vrsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7} +# INTEL: vrsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x7c,0x0f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vrsqrtpbf16 (%eax){1to8}, %xmm2 -# INTEL: vrsqrtpbf16 xmm2, word ptr [eax]{1to8} +# ATT: vrsqrtbf16 (%eax){1to8}, %xmm2 +# INTEL: vrsqrtbf16 xmm2, word ptr [eax]{1to8} 0x62,0xf6,0x7c,0x18,0x4e,0x10 -# ATT: vrsqrtpbf16 -512(,%ebp,2), %xmm2 -# INTEL: vrsqrtpbf16 xmm2, xmmword ptr [2*ebp - 512] +# ATT: vrsqrtbf16 -512(,%ebp,2), %xmm2 +# INTEL: vrsqrtbf16 xmm2, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x7c,0x08,0x4e,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vrsqrtpbf16 2032(%ecx), %xmm2 {%k7} {z} -# INTEL: vrsqrtpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] +# ATT: vrsqrtbf16 2032(%ecx), %xmm2 {%k7} {z} +# INTEL: vrsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] 0x62,0xf6,0x7c,0x8f,0x4e,0x51,0x7f -# ATT: vrsqrtpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -# INTEL: vrsqrtpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +# ATT: vrsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +# INTEL: vrsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} 0x62,0xf6,0x7c,0x9f,0x4e,0x52,0x80 -# ATT: vrsqrtpbf16 268435456(%esp,%esi,8), %ymm2 -# INTEL: vrsqrtpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vrsqrtbf16 268435456(%esp,%esi,8), %ymm2 +# INTEL: vrsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x7c,0x28,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vrsqrtpbf16 291(%edi,%eax,4), %ymm2 {%k7} -# INTEL: 
vrsqrtpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] +# ATT: vrsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7} +# INTEL: vrsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x7c,0x2f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vrsqrtpbf16 (%eax){1to16}, %ymm2 -# INTEL: vrsqrtpbf16 ymm2, word ptr [eax]{1to16} +# ATT: vrsqrtbf16 (%eax){1to16}, %ymm2 +# INTEL: vrsqrtbf16 ymm2, word ptr [eax]{1to16} 0x62,0xf6,0x7c,0x38,0x4e,0x10 -# ATT: vrsqrtpbf16 -1024(,%ebp,2), %ymm2 -# INTEL: vrsqrtpbf16 ymm2, ymmword ptr [2*ebp - 1024] +# ATT: vrsqrtbf16 -1024(,%ebp,2), %ymm2 +# INTEL: vrsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x7c,0x28,0x4e,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vrsqrtpbf16 4064(%ecx), %ymm2 {%k7} {z} -# INTEL: vrsqrtpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +# ATT: vrsqrtbf16 4064(%ecx), %ymm2 {%k7} {z} +# INTEL: vrsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] 0x62,0xf6,0x7c,0xaf,0x4e,0x51,0x7f -# ATT: vrsqrtpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -# INTEL: vrsqrtpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} +# ATT: vrsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +# INTEL: vrsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} 0x62,0xf6,0x7c,0xbf,0x4e,0x52,0x80 -# ATT: vrsqrtpbf16 268435456(%esp,%esi,8), %zmm2 -# INTEL: vrsqrtpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vrsqrtbf16 268435456(%esp,%esi,8), %zmm2 +# INTEL: vrsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x7c,0x48,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vrsqrtpbf16 291(%edi,%eax,4), %zmm2 {%k7} -# INTEL: vrsqrtpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +# ATT: vrsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7} +# INTEL: vrsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x7c,0x4f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vrsqrtpbf16 (%eax){1to32}, %zmm2 -# INTEL: vrsqrtpbf16 zmm2, word ptr [eax]{1to32} +# ATT: vrsqrtbf16 (%eax){1to32}, %zmm2 +# INTEL: vrsqrtbf16 zmm2, word ptr [eax]{1to32} 0x62,0xf6,0x7c,0x58,0x4e,0x10 -# ATT: 
vrsqrtpbf16 -2048(,%ebp,2), %zmm2 -# INTEL: vrsqrtpbf16 zmm2, zmmword ptr [2*ebp - 2048] +# ATT: vrsqrtbf16 -2048(,%ebp,2), %zmm2 +# INTEL: vrsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x7c,0x48,0x4e,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vrsqrtpbf16 8128(%ecx), %zmm2 {%k7} {z} -# INTEL: vrsqrtpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +# ATT: vrsqrtbf16 8128(%ecx), %zmm2 {%k7} {z} +# INTEL: vrsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] 0x62,0xf6,0x7c,0xcf,0x4e,0x51,0x7f -# ATT: vrsqrtpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -# INTEL: vrsqrtpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +# ATT: vrsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +# INTEL: vrsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} 0x62,0xf6,0x7c,0xdf,0x4e,0x52,0x80 -# ATT: vscalefpbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vscalefpbf16 ymm2, ymm3, ymm4 +# ATT: vscalefbf16 %ymm4, %ymm3, %ymm2 +# INTEL: vscalefbf16 ymm2, ymm3, ymm4 0x62,0xf6,0x64,0x28,0x2c,0xd4 -# ATT: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vscalefpbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vscalefbf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf6,0x64,0x2f,0x2c,0xd4 -# ATT: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf6,0x64,0xaf,0x2c,0xd4 -# ATT: vscalefpbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vscalefpbf16 zmm2, zmm3, zmm4 +# ATT: vscalefbf16 %zmm4, %zmm3, %zmm2 +# INTEL: vscalefbf16 zmm2, zmm3, zmm4 0x62,0xf6,0x64,0x48,0x2c,0xd4 -# ATT: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vscalefpbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vscalefbf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf6,0x64,0x4f,0x2c,0xd4 -# ATT: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vscalefpbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, zmm4 
0x62,0xf6,0x64,0xcf,0x2c,0xd4 -# ATT: vscalefpbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vscalefpbf16 xmm2, xmm3, xmm4 +# ATT: vscalefbf16 %xmm4, %xmm3, %xmm2 +# INTEL: vscalefbf16 xmm2, xmm3, xmm4 0x62,0xf6,0x64,0x08,0x2c,0xd4 -# ATT: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vscalefpbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vscalefbf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf6,0x64,0x0f,0x2c,0xd4 -# ATT: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf6,0x64,0x8f,0x2c,0xd4 -# ATT: vscalefpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vscalefpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vscalefbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vscalefbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x48,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vscalefpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vscalefpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vscalefbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vscalefbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x4f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vscalefpbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vscalefpbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vscalefbf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vscalefbf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf6,0x64,0x58,0x2c,0x10 -# ATT: vscalefpbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vscalefpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vscalefbf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vscalefbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf6,0x64,0x48,0x2c,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vscalefpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vscalefpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vscalefbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: 
vscalefbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf6,0x64,0xcf,0x2c,0x51,0x7f -# ATT: vscalefpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vscalefpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vscalefbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf6,0x64,0xdf,0x2c,0x52,0x80 -# ATT: vscalefpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vscalefpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vscalefbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vscalefbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x28,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vscalefpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vscalefpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vscalefbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vscalefbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x2f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vscalefpbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vscalefpbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vscalefbf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vscalefbf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf6,0x64,0x38,0x2c,0x10 -# ATT: vscalefpbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vscalefpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vscalefbf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vscalefbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf6,0x64,0x28,0x2c,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vscalefpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vscalefbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf6,0x64,0xaf,0x2c,0x51,0x7f -# ATT: vscalefpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vscalefpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vscalefbf16 -256(%edx){1to16}, 
%ymm3, %ymm2 {%k7} {z} +# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf6,0x64,0xbf,0x2c,0x52,0x80 -# ATT: vscalefpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vscalefpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vscalefbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vscalefbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf6,0x64,0x08,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vscalefpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vscalefpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vscalefbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vscalefbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf6,0x64,0x0f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vscalefpbf16 (%eax){1to8}, %xmm3, %xmm2 -# INTEL: vscalefpbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vscalefbf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vscalefbf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf6,0x64,0x18,0x2c,0x10 -# ATT: vscalefpbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vscalefpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vscalefbf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vscalefbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf6,0x64,0x08,0x2c,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vscalefpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vscalefbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf6,0x64,0x8f,0x2c,0x51,0x7f -# ATT: vscalefpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vscalefpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vscalefbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf6,0x64,0x9f,0x2c,0x52,0x80 -# ATT: vsqrtnepbf16 %xmm3, %xmm2 -# INTEL: vsqrtnepbf16 xmm2, xmm3 +# ATT: vsqrtbf16 %xmm3, %xmm2 +# INTEL: vsqrtbf16 xmm2, xmm3 
0x62,0xf5,0x7d,0x08,0x51,0xd3 -# ATT: vsqrtnepbf16 %xmm3, %xmm2 {%k7} -# INTEL: vsqrtnepbf16 xmm2 {k7}, xmm3 +# ATT: vsqrtbf16 %xmm3, %xmm2 {%k7} +# INTEL: vsqrtbf16 xmm2 {k7}, xmm3 0x62,0xf5,0x7d,0x0f,0x51,0xd3 -# ATT: vsqrtnepbf16 %xmm3, %xmm2 {%k7} {z} -# INTEL: vsqrtnepbf16 xmm2 {k7} {z}, xmm3 +# ATT: vsqrtbf16 %xmm3, %xmm2 {%k7} {z} +# INTEL: vsqrtbf16 xmm2 {k7} {z}, xmm3 0x62,0xf5,0x7d,0x8f,0x51,0xd3 -# ATT: vsqrtnepbf16 %zmm3, %zmm2 -# INTEL: vsqrtnepbf16 zmm2, zmm3 +# ATT: vsqrtbf16 %zmm3, %zmm2 +# INTEL: vsqrtbf16 zmm2, zmm3 0x62,0xf5,0x7d,0x48,0x51,0xd3 -# ATT: vsqrtnepbf16 %zmm3, %zmm2 {%k7} -# INTEL: vsqrtnepbf16 zmm2 {k7}, zmm3 +# ATT: vsqrtbf16 %zmm3, %zmm2 {%k7} +# INTEL: vsqrtbf16 zmm2 {k7}, zmm3 0x62,0xf5,0x7d,0x4f,0x51,0xd3 -# ATT: vsqrtnepbf16 %zmm3, %zmm2 {%k7} {z} -# INTEL: vsqrtnepbf16 zmm2 {k7} {z}, zmm3 +# ATT: vsqrtbf16 %zmm3, %zmm2 {%k7} {z} +# INTEL: vsqrtbf16 zmm2 {k7} {z}, zmm3 0x62,0xf5,0x7d,0xcf,0x51,0xd3 -# ATT: vsqrtnepbf16 %ymm3, %ymm2 -# INTEL: vsqrtnepbf16 ymm2, ymm3 +# ATT: vsqrtbf16 %ymm3, %ymm2 +# INTEL: vsqrtbf16 ymm2, ymm3 0x62,0xf5,0x7d,0x28,0x51,0xd3 -# ATT: vsqrtnepbf16 %ymm3, %ymm2 {%k7} -# INTEL: vsqrtnepbf16 ymm2 {k7}, ymm3 +# ATT: vsqrtbf16 %ymm3, %ymm2 {%k7} +# INTEL: vsqrtbf16 ymm2 {k7}, ymm3 0x62,0xf5,0x7d,0x2f,0x51,0xd3 -# ATT: vsqrtnepbf16 %ymm3, %ymm2 {%k7} {z} -# INTEL: vsqrtnepbf16 ymm2 {k7} {z}, ymm3 +# ATT: vsqrtbf16 %ymm3, %ymm2 {%k7} {z} +# INTEL: vsqrtbf16 ymm2 {k7} {z}, ymm3 0x62,0xf5,0x7d,0xaf,0x51,0xd3 -# ATT: vsqrtnepbf16 268435456(%esp,%esi,8), %xmm2 -# INTEL: vsqrtnepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vsqrtbf16 268435456(%esp,%esi,8), %xmm2 +# INTEL: vsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x7d,0x08,0x51,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vsqrtnepbf16 291(%edi,%eax,4), %xmm2 {%k7} -# INTEL: vsqrtnepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +# ATT: vsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7} +# INTEL: vsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 
291] 0x62,0xf5,0x7d,0x0f,0x51,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vsqrtnepbf16 (%eax){1to8}, %xmm2 -# INTEL: vsqrtnepbf16 xmm2, word ptr [eax]{1to8} +# ATT: vsqrtbf16 (%eax){1to8}, %xmm2 +# INTEL: vsqrtbf16 xmm2, word ptr [eax]{1to8} 0x62,0xf5,0x7d,0x18,0x51,0x10 -# ATT: vsqrtnepbf16 -512(,%ebp,2), %xmm2 -# INTEL: vsqrtnepbf16 xmm2, xmmword ptr [2*ebp - 512] +# ATT: vsqrtbf16 -512(,%ebp,2), %xmm2 +# INTEL: vsqrtbf16 xmm2, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x7d,0x08,0x51,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vsqrtnepbf16 2032(%ecx), %xmm2 {%k7} {z} -# INTEL: vsqrtnepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] +# ATT: vsqrtbf16 2032(%ecx), %xmm2 {%k7} {z} +# INTEL: vsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] 0x62,0xf5,0x7d,0x8f,0x51,0x51,0x7f -# ATT: vsqrtnepbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -# INTEL: vsqrtnepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +# ATT: vsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +# INTEL: vsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} 0x62,0xf5,0x7d,0x9f,0x51,0x52,0x80 -# ATT: vsqrtnepbf16 268435456(%esp,%esi,8), %ymm2 -# INTEL: vsqrtnepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vsqrtbf16 268435456(%esp,%esi,8), %ymm2 +# INTEL: vsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x7d,0x28,0x51,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vsqrtnepbf16 291(%edi,%eax,4), %ymm2 {%k7} -# INTEL: vsqrtnepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] +# ATT: vsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7} +# INTEL: vsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x7d,0x2f,0x51,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vsqrtnepbf16 (%eax){1to16}, %ymm2 -# INTEL: vsqrtnepbf16 ymm2, word ptr [eax]{1to16} +# ATT: vsqrtbf16 (%eax){1to16}, %ymm2 +# INTEL: vsqrtbf16 ymm2, word ptr [eax]{1to16} 0x62,0xf5,0x7d,0x38,0x51,0x10 -# ATT: vsqrtnepbf16 -1024(,%ebp,2), %ymm2 -# INTEL: vsqrtnepbf16 ymm2, ymmword ptr [2*ebp - 1024] +# ATT: vsqrtbf16 -1024(,%ebp,2), %ymm2 +# INTEL: vsqrtbf16 ymm2, ymmword ptr [2*ebp - 
1024] 0x62,0xf5,0x7d,0x28,0x51,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vsqrtnepbf16 4064(%ecx), %ymm2 {%k7} {z} -# INTEL: vsqrtnepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +# ATT: vsqrtbf16 4064(%ecx), %ymm2 {%k7} {z} +# INTEL: vsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] 0x62,0xf5,0x7d,0xaf,0x51,0x51,0x7f -# ATT: vsqrtnepbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -# INTEL: vsqrtnepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} +# ATT: vsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +# INTEL: vsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} 0x62,0xf5,0x7d,0xbf,0x51,0x52,0x80 -# ATT: vsqrtnepbf16 268435456(%esp,%esi,8), %zmm2 -# INTEL: vsqrtnepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vsqrtbf16 268435456(%esp,%esi,8), %zmm2 +# INTEL: vsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x7d,0x48,0x51,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vsqrtnepbf16 291(%edi,%eax,4), %zmm2 {%k7} -# INTEL: vsqrtnepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +# ATT: vsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7} +# INTEL: vsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x7d,0x4f,0x51,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vsqrtnepbf16 (%eax){1to32}, %zmm2 -# INTEL: vsqrtnepbf16 zmm2, word ptr [eax]{1to32} +# ATT: vsqrtbf16 (%eax){1to32}, %zmm2 +# INTEL: vsqrtbf16 zmm2, word ptr [eax]{1to32} 0x62,0xf5,0x7d,0x58,0x51,0x10 -# ATT: vsqrtnepbf16 -2048(,%ebp,2), %zmm2 -# INTEL: vsqrtnepbf16 zmm2, zmmword ptr [2*ebp - 2048] +# ATT: vsqrtbf16 -2048(,%ebp,2), %zmm2 +# INTEL: vsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x7d,0x48,0x51,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vsqrtnepbf16 8128(%ecx), %zmm2 {%k7} {z} -# INTEL: vsqrtnepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +# ATT: vsqrtbf16 8128(%ecx), %zmm2 {%k7} {z} +# INTEL: vsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] 0x62,0xf5,0x7d,0xcf,0x51,0x51,0x7f -# ATT: vsqrtnepbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -# INTEL: vsqrtnepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +# ATT: 
vsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +# INTEL: vsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} 0x62,0xf5,0x7d,0xdf,0x51,0x52,0x80 -# ATT: vsubnepbf16 %ymm4, %ymm3, %ymm2 -# INTEL: vsubnepbf16 ymm2, ymm3, ymm4 +# ATT: vsubbf16 %ymm4, %ymm3, %ymm2 +# INTEL: vsubbf16 ymm2, ymm3, ymm4 0x62,0xf5,0x65,0x28,0x5c,0xd4 -# ATT: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} -# INTEL: vsubnepbf16 ymm2 {k7}, ymm3, ymm4 +# ATT: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} +# INTEL: vsubbf16 ymm2 {k7}, ymm3, ymm4 0x62,0xf5,0x65,0x2f,0x5c,0xd4 -# ATT: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -# INTEL: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +# ATT: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, ymm4 0x62,0xf5,0x65,0xaf,0x5c,0xd4 -# ATT: vsubnepbf16 %zmm4, %zmm3, %zmm2 -# INTEL: vsubnepbf16 zmm2, zmm3, zmm4 +# ATT: vsubbf16 %zmm4, %zmm3, %zmm2 +# INTEL: vsubbf16 zmm2, zmm3, zmm4 0x62,0xf5,0x65,0x48,0x5c,0xd4 -# ATT: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} -# INTEL: vsubnepbf16 zmm2 {k7}, zmm3, zmm4 +# ATT: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} +# INTEL: vsubbf16 zmm2 {k7}, zmm3, zmm4 0x62,0xf5,0x65,0x4f,0x5c,0xd4 -# ATT: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -# INTEL: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +# ATT: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, zmm4 0x62,0xf5,0x65,0xcf,0x5c,0xd4 -# ATT: vsubnepbf16 %xmm4, %xmm3, %xmm2 -# INTEL: vsubnepbf16 xmm2, xmm3, xmm4 +# ATT: vsubbf16 %xmm4, %xmm3, %xmm2 +# INTEL: vsubbf16 xmm2, xmm3, xmm4 0x62,0xf5,0x65,0x08,0x5c,0xd4 -# ATT: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} -# INTEL: vsubnepbf16 xmm2 {k7}, xmm3, xmm4 +# ATT: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} +# INTEL: vsubbf16 xmm2 {k7}, xmm3, xmm4 0x62,0xf5,0x65,0x0f,0x5c,0xd4 -# ATT: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -# INTEL: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +# ATT: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, xmm4 0x62,0xf5,0x65,0x8f,0x5c,0xd4 -# ATT: vsubnepbf16 
268435456(%esp,%esi,8), %zmm3, %zmm2 -# INTEL: vsubnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +# ATT: vsubbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +# INTEL: vsubbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x48,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vsubnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -# INTEL: vsubnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +# ATT: vsubbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +# INTEL: vsubbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x4f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vsubnepbf16 (%eax){1to32}, %zmm3, %zmm2 -# INTEL: vsubnepbf16 zmm2, zmm3, word ptr [eax]{1to32} +# ATT: vsubbf16 (%eax){1to32}, %zmm3, %zmm2 +# INTEL: vsubbf16 zmm2, zmm3, word ptr [eax]{1to32} 0x62,0xf5,0x65,0x58,0x5c,0x10 -# ATT: vsubnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 -# INTEL: vsubnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +# ATT: vsubbf16 -2048(,%ebp,2), %zmm3, %zmm2 +# INTEL: vsubbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] 0x62,0xf5,0x65,0x48,0x5c,0x14,0x6d,0x00,0xf8,0xff,0xff -# ATT: vsubnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -# INTEL: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +# ATT: vsubbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 0x62,0xf5,0x65,0xcf,0x5c,0x51,0x7f -# ATT: vsubnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -# INTEL: vsubnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +# ATT: vsubbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} 0x62,0xf5,0x65,0xdf,0x5c,0x52,0x80 -# ATT: vsubnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -# INTEL: vsubnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +# ATT: vsubbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +# INTEL: vsubbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x28,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vsubnepbf16 
291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -# INTEL: vsubnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +# ATT: vsubbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +# INTEL: vsubbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x2f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vsubnepbf16 (%eax){1to16}, %ymm3, %ymm2 -# INTEL: vsubnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +# ATT: vsubbf16 (%eax){1to16}, %ymm3, %ymm2 +# INTEL: vsubbf16 ymm2, ymm3, word ptr [eax]{1to16} 0x62,0xf5,0x65,0x38,0x5c,0x10 -# ATT: vsubnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 -# INTEL: vsubnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +# ATT: vsubbf16 -1024(,%ebp,2), %ymm3, %ymm2 +# INTEL: vsubbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] 0x62,0xf5,0x65,0x28,0x5c,0x14,0x6d,0x00,0xfc,0xff,0xff -# ATT: vsubnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -# INTEL: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +# ATT: vsubbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] 0x62,0xf5,0x65,0xaf,0x5c,0x51,0x7f -# ATT: vsubnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -# INTEL: vsubnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +# ATT: vsubbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} 0x62,0xf5,0x65,0xbf,0x5c,0x52,0x80 -# ATT: vsubnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -# INTEL: vsubnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +# ATT: vsubbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +# INTEL: vsubbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] 0x62,0xf5,0x65,0x08,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10 -# ATT: vsubnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -# INTEL: vsubnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +# ATT: vsubbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +# INTEL: vsubbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] 0x62,0xf5,0x65,0x0f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00 -# ATT: vsubnepbf16 
(%eax){1to8}, %xmm3, %xmm2 -# INTEL: vsubnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +# ATT: vsubbf16 (%eax){1to8}, %xmm3, %xmm2 +# INTEL: vsubbf16 xmm2, xmm3, word ptr [eax]{1to8} 0x62,0xf5,0x65,0x18,0x5c,0x10 -# ATT: vsubnepbf16 -512(,%ebp,2), %xmm3, %xmm2 -# INTEL: vsubnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +# ATT: vsubbf16 -512(,%ebp,2), %xmm3, %xmm2 +# INTEL: vsubbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] 0x62,0xf5,0x65,0x08,0x5c,0x14,0x6d,0x00,0xfe,0xff,0xff -# ATT: vsubnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -# INTEL: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +# ATT: vsubbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] 0x62,0xf5,0x65,0x8f,0x5c,0x51,0x7f -# ATT: vsubnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -# INTEL: vsubnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +# ATT: vsubbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} 0x62,0xf5,0x65,0x9f,0x5c,0x52,0x80 diff --git a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt index 953ef8dd8a14c..ff321ed3488c7 100644 --- a/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt +++ b/llvm/test/MC/Disassembler/X86/avx10.2-bf16-64.txt @@ -1,208 +1,208 @@ # RUN: llvm-mc --disassemble %s -triple=x86_64 | FileCheck %s --check-prefixes=ATT # RUN: llvm-mc --disassemble %s -triple=x86_64 --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL -# ATT: vaddnepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vaddnepbf16 ymm22, ymm23, ymm24 +# ATT: vaddbf16 %ymm24, %ymm23, %ymm22 +# INTEL: vaddbf16 ymm22, ymm23, ymm24 0x62,0x85,0x45,0x20,0x58,0xf0 -# ATT: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vaddnepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vaddbf16 ymm22 {k7}, ymm23, ymm24 0x62,0x85,0x45,0x27,0x58,0xf0 -# ATT: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: 
vaddnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vaddbf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x85,0x45,0xa7,0x58,0xf0 -# ATT: vaddnepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vaddnepbf16 zmm22, zmm23, zmm24 +# ATT: vaddbf16 %zmm24, %zmm23, %zmm22 +# INTEL: vaddbf16 zmm22, zmm23, zmm24 0x62,0x85,0x45,0x40,0x58,0xf0 -# ATT: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vaddnepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vaddbf16 zmm22 {k7}, zmm23, zmm24 0x62,0x85,0x45,0x47,0x58,0xf0 -# ATT: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vaddbf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x85,0x45,0xc7,0x58,0xf0 -# ATT: vaddnepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vaddnepbf16 xmm22, xmm23, xmm24 +# ATT: vaddbf16 %xmm24, %xmm23, %xmm22 +# INTEL: vaddbf16 xmm22, xmm23, xmm24 0x62,0x85,0x45,0x00,0x58,0xf0 -# ATT: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vaddnepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vaddbf16 xmm22 {k7}, xmm23, xmm24 0x62,0x85,0x45,0x07,0x58,0xf0 -# ATT: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vaddbf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x85,0x45,0x87,0x58,0xf0 -# ATT: vaddnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vaddnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vaddbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vaddbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x40,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vaddnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vaddnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vaddbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vaddbf16 zmm22 {k7}, zmm23, zmmword 
ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x47,0x58,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vaddnepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vaddnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vaddbf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vaddbf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe5,0x45,0x50,0x58,0x35,0x00,0x00,0x00,0x00 -# ATT: vaddnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vaddnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vaddbf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vaddbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x45,0x40,0x58,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vaddnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vaddbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vaddbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe5,0x45,0xc7,0x58,0x71,0x7f -# ATT: vaddnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vaddnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vaddbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vaddbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe5,0x45,0xd7,0x58,0x72,0x80 -# ATT: vaddnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vaddnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vaddbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vaddbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x20,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vaddnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vaddnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vaddbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vaddbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x27,0x58,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vaddnepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vaddnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vaddbf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vaddbf16 
ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe5,0x45,0x30,0x58,0x35,0x00,0x00,0x00,0x00 -# ATT: vaddnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vaddnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vaddbf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vaddbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe5,0x45,0x20,0x58,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vaddnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vaddnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vaddbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vaddbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe5,0x45,0xa7,0x58,0x71,0x7f -# ATT: vaddnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vaddnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vaddbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vaddbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x45,0xb7,0x58,0x72,0x80 -# ATT: vaddnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vaddnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vaddbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vaddbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x00,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vaddnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vaddnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vaddbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vaddbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x07,0x58,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vaddnepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vaddnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vaddbf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vaddbf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe5,0x45,0x10,0x58,0x35,0x00,0x00,0x00,0x00 -# ATT: vaddnepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vaddnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vaddbf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: 
vaddbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe5,0x45,0x00,0x58,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vaddnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vaddbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vaddbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe5,0x45,0x87,0x58,0x71,0x7f -# ATT: vaddnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vaddnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vaddbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vaddbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x45,0x97,0x58,0x72,0x80 -# ATT: vcmppbf16 $123, %ymm24, %ymm23, %k5 -# INTEL: vcmppbf16 k5, ymm23, ymm24, 123 +# ATT: vcmpbf16 $123, %ymm24, %ymm23, %k5 +# INTEL: vcmpbf16 k5, ymm23, ymm24, 123 0x62,0x93,0x47,0x20,0xc2,0xe8,0x7b -# ATT: vcmppbf16 $123, %ymm24, %ymm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm23, ymm24, 123 +# ATT: vcmpbf16 $123, %ymm24, %ymm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm23, ymm24, 123 0x62,0x93,0x47,0x27,0xc2,0xe8,0x7b -# ATT: vcmppbf16 $123, %xmm24, %xmm23, %k5 -# INTEL: vcmppbf16 k5, xmm23, xmm24, 123 +# ATT: vcmpbf16 $123, %xmm24, %xmm23, %k5 +# INTEL: vcmpbf16 k5, xmm23, xmm24, 123 0x62,0x93,0x47,0x00,0xc2,0xe8,0x7b -# ATT: vcmppbf16 $123, %xmm24, %xmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm23, xmm24, 123 +# ATT: vcmpbf16 $123, %xmm24, %xmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm23, xmm24, 123 0x62,0x93,0x47,0x07,0xc2,0xe8,0x7b -# ATT: vcmppbf16 $123, %zmm24, %zmm23, %k5 -# INTEL: vcmppbf16 k5, zmm23, zmm24, 123 +# ATT: vcmpbf16 $123, %zmm24, %zmm23, %k5 +# INTEL: vcmpbf16 k5, zmm23, zmm24, 123 0x62,0x93,0x47,0x40,0xc2,0xe8,0x7b -# ATT: vcmppbf16 $123, %zmm24, %zmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm23, zmm24, 123 +# ATT: vcmpbf16 $123, %zmm24, %zmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm23, zmm24, 123 0x62,0x93,0x47,0x47,0xc2,0xe8,0x7b -# ATT: vcmppbf16 
$123, 268435456(%rbp,%r14,8), %zmm23, %k5 -# INTEL: vcmppbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vcmpbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5 +# INTEL: vcmpbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xb3,0x47,0x40,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vcmppbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vcmpbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123 0x62,0xd3,0x47,0x47,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, (%rip){1to32}, %zmm23, %k5 -# INTEL: vcmppbf16 k5, zmm23, word ptr [rip]{1to32}, 123 +# ATT: vcmpbf16 $123, (%rip){1to32}, %zmm23, %k5 +# INTEL: vcmpbf16 k5, zmm23, word ptr [rip]{1to32}, 123 0x62,0xf3,0x47,0x50,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, -2048(,%rbp,2), %zmm23, %k5 -# INTEL: vcmppbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123 +# ATT: vcmpbf16 $123, -2048(,%rbp,2), %zmm23, %k5 +# INTEL: vcmpbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123 0x62,0xf3,0x47,0x40,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vcmppbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123 +# ATT: vcmpbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123 0x62,0xf3,0x47,0x47,0xc2,0x69,0x7f,0x7b -# ATT: vcmppbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123 +# ATT: vcmpbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123 0x62,0xf3,0x47,0x57,0xc2,0x6a,0x80,0x7b -# ATT: vcmppbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5 -# INTEL: vcmppbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vcmpbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5 +# INTEL: vcmpbf16 k5, xmm23, xmmword ptr 
[rbp + 8*r14 + 268435456], 123 0x62,0xb3,0x47,0x00,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vcmppbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vcmpbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123 0x62,0xd3,0x47,0x07,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, (%rip){1to8}, %xmm23, %k5 -# INTEL: vcmppbf16 k5, xmm23, word ptr [rip]{1to8}, 123 +# ATT: vcmpbf16 $123, (%rip){1to8}, %xmm23, %k5 +# INTEL: vcmpbf16 k5, xmm23, word ptr [rip]{1to8}, 123 0x62,0xf3,0x47,0x10,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, -512(,%rbp,2), %xmm23, %k5 -# INTEL: vcmppbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123 +# ATT: vcmpbf16 $123, -512(,%rbp,2), %xmm23, %k5 +# INTEL: vcmpbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123 0x62,0xf3,0x47,0x00,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vcmppbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123 +# ATT: vcmpbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123 0x62,0xf3,0x47,0x07,0xc2,0x69,0x7f,0x7b -# ATT: vcmppbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123 +# ATT: vcmpbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123 0x62,0xf3,0x47,0x17,0xc2,0x6a,0x80,0x7b -# ATT: vcmppbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5 -# INTEL: vcmppbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vcmpbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5 +# INTEL: vcmpbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xb3,0x47,0x20,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vcmppbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123 +# ATT: 
vcmpbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123 0x62,0xd3,0x47,0x27,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, (%rip){1to16}, %ymm23, %k5 -# INTEL: vcmppbf16 k5, ymm23, word ptr [rip]{1to16}, 123 +# ATT: vcmpbf16 $123, (%rip){1to16}, %ymm23, %k5 +# INTEL: vcmpbf16 k5, ymm23, word ptr [rip]{1to16}, 123 0x62,0xf3,0x47,0x30,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b -# ATT: vcmppbf16 $123, -1024(,%rbp,2), %ymm23, %k5 -# INTEL: vcmppbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123 +# ATT: vcmpbf16 $123, -1024(,%rbp,2), %ymm23, %k5 +# INTEL: vcmpbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123 0x62,0xf3,0x47,0x20,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vcmppbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123 +# ATT: vcmpbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123 0x62,0xf3,0x47,0x27,0xc2,0x69,0x7f,0x7b -# ATT: vcmppbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7} -# INTEL: vcmppbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123 +# ATT: vcmpbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7} +# INTEL: vcmpbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123 0x62,0xf3,0x47,0x37,0xc2,0x6a,0x80,0x7b # ATT: vcomsbf16 %xmm23, %xmm22 @@ -233,2783 +233,2783 @@ # INTEL: vcomsbf16 xmm22, word ptr [rdx - 256] 0x62,0xe5,0x7d,0x08,0x2f,0x72,0x80 -# ATT: vdivnepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vdivnepbf16 ymm22, ymm23, ymm24 +# ATT: vdivbf16 %ymm24, %ymm23, %ymm22 +# INTEL: vdivbf16 ymm22, ymm23, ymm24 0x62,0x85,0x45,0x20,0x5e,0xf0 -# ATT: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vdivnepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vdivbf16 ymm22 {k7}, ymm23, ymm24 0x62,0x85,0x45,0x27,0x5e,0xf0 -# ATT: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vdivbf16 %ymm24, 
%ymm23, %ymm22 {%k7} {z} +# INTEL: vdivbf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x85,0x45,0xa7,0x5e,0xf0 -# ATT: vdivnepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vdivnepbf16 zmm22, zmm23, zmm24 +# ATT: vdivbf16 %zmm24, %zmm23, %zmm22 +# INTEL: vdivbf16 zmm22, zmm23, zmm24 0x62,0x85,0x45,0x40,0x5e,0xf0 -# ATT: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vdivnepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vdivbf16 zmm22 {k7}, zmm23, zmm24 0x62,0x85,0x45,0x47,0x5e,0xf0 -# ATT: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vdivbf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x85,0x45,0xc7,0x5e,0xf0 -# ATT: vdivnepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vdivnepbf16 xmm22, xmm23, xmm24 +# ATT: vdivbf16 %xmm24, %xmm23, %xmm22 +# INTEL: vdivbf16 xmm22, xmm23, xmm24 0x62,0x85,0x45,0x00,0x5e,0xf0 -# ATT: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vdivnepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vdivbf16 xmm22 {k7}, xmm23, xmm24 0x62,0x85,0x45,0x07,0x5e,0xf0 -# ATT: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vdivbf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x85,0x45,0x87,0x5e,0xf0 -# ATT: vdivnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vdivnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vdivbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vdivbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x40,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vdivnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vdivnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vdivbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vdivbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 
0x62,0xc5,0x45,0x47,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vdivnepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vdivnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vdivbf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vdivbf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe5,0x45,0x50,0x5e,0x35,0x00,0x00,0x00,0x00 -# ATT: vdivnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vdivnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vdivbf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vdivbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x45,0x40,0x5e,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vdivnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vdivbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vdivbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe5,0x45,0xc7,0x5e,0x71,0x7f -# ATT: vdivnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vdivnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vdivbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vdivbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe5,0x45,0xd7,0x5e,0x72,0x80 -# ATT: vdivnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vdivnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vdivbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vdivbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x20,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vdivnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vdivnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vdivbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vdivbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x27,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vdivnepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vdivnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vdivbf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vdivbf16 ymm22, ymm23, word ptr 
[rip]{1to16} 0x62,0xe5,0x45,0x30,0x5e,0x35,0x00,0x00,0x00,0x00 -# ATT: vdivnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vdivnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vdivbf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vdivbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe5,0x45,0x20,0x5e,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vdivnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vdivbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vdivbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe5,0x45,0xa7,0x5e,0x71,0x7f -# ATT: vdivnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vdivnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vdivbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vdivbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x45,0xb7,0x5e,0x72,0x80 -# ATT: vdivnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vdivnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vdivbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vdivbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x00,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vdivnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vdivnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vdivbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vdivbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x07,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vdivnepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vdivnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vdivbf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vdivbf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe5,0x45,0x10,0x5e,0x35,0x00,0x00,0x00,0x00 -# ATT: vdivnepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vdivnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vdivbf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vdivbf16 xmm22, xmm23, 
xmmword ptr [2*rbp - 512] 0x62,0xe5,0x45,0x00,0x5e,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vdivnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vdivbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vdivbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe5,0x45,0x87,0x5e,0x71,0x7f -# ATT: vdivnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vdivnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vdivbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vdivbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x45,0x97,0x5e,0x72,0x80 -# ATT: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfmadd132nepbf16 ymm22, ymm23, ymm24 +# ATT: vfmadd132bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfmadd132bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0x98,0xf0 -# ATT: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfmadd132bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0x98,0xf0 -# ATT: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0x98,0xf0 -# ATT: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfmadd132nepbf16 zmm22, zmm23, zmm24 +# ATT: vfmadd132bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfmadd132bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0x98,0xf0 -# ATT: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfmadd132bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0x98,0xf0 -# ATT: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: 
vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0x98,0xf0 -# ATT: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfmadd132nepbf16 xmm22, xmm23, xmm24 +# ATT: vfmadd132bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfmadd132bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0x98,0xf0 -# ATT: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfmadd132bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0x98,0xf0 -# ATT: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0x98,0xf0 -# ATT: vfmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0x98,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfmadd132bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0x98,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 
0x62,0xe6,0x44,0x40,0x98,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0x98,0x71,0x7f -# ATT: vfmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0x98,0x72,0x80 -# ATT: vfmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0x98,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfmadd132bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0x98,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0x98,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: 
vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0x98,0x71,0x7f -# ATT: vfmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0x98,0x72,0x80 -# ATT: vfmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0x98,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfmadd132bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0x98,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0x98,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: 
vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0x98,0x71,0x7f -# ATT: vfmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0x98,0x72,0x80 -# ATT: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfmadd213nepbf16 ymm22, ymm23, ymm24 +# ATT: vfmadd213bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfmadd213bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfmadd213bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfmadd213nepbf16 zmm22, zmm23, zmm24 +# ATT: vfmadd213bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfmadd213bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfmadd213bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfmadd213nepbf16 xmm22, xmm23, xmm24 +# ATT: vfmadd213bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfmadd213bf16 xmm22, xmm23, 
xmm24 0x62,0x86,0x44,0x00,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfmadd213bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xa8,0xf0 -# ATT: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xa8,0xf0 -# ATT: vfmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfmadd213bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xa8,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xa8,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmadd213bf16 zmm22 {k7} 
{z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xa8,0x71,0x7f -# ATT: vfmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xa8,0x72,0x80 -# ATT: vfmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfmadd213bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xa8,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xa8,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xa8,0x71,0x7f -# ATT: vfmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 
{%k7} {z} -# INTEL: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xa8,0x72,0x80 -# ATT: vfmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfmadd213bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xa8,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0xa8,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xa8,0x71,0x7f -# ATT: vfmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 
{%k7} {z} +# INTEL: vfmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0xa8,0x72,0x80 -# ATT: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfmadd231nepbf16 ymm22, ymm23, ymm24 +# ATT: vfmadd231bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfmadd231bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xb8,0xf0 -# ATT: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfmadd231bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0xb8,0xf0 -# ATT: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0xb8,0xf0 -# ATT: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfmadd231nepbf16 zmm22, zmm23, zmm24 +# ATT: vfmadd231bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfmadd231bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xb8,0xf0 -# ATT: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfmadd231bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0xb8,0xf0 -# ATT: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xb8,0xf0 -# ATT: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfmadd231nepbf16 xmm22, xmm23, xmm24 +# ATT: vfmadd231bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfmadd231bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0xb8,0xf0 -# ATT: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfmadd231bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xb8,0xf0 -# ATT: vfmadd231nepbf16 
%xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xb8,0xf0 -# ATT: vfmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfmadd231bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xb8,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xb8,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xb8,0x71,0x7f -# ATT: vfmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: 
vfmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xb8,0x72,0x80 -# ATT: vfmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfmadd231bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xb8,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xb8,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xb8,0x71,0x7f -# ATT: vfmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xb8,0x72,0x80 -# ATT: vfmadd231nepbf16 
268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfmadd231bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xb8,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0xb8,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xb8,0x71,0x7f -# ATT: vfmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0xb8,0x72,0x80 -# ATT: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfmsub132nepbf16 ymm22, ymm23, ymm24 +# ATT: vfmsub132bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfmsub132bf16 
ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfmsub132bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfmsub132nepbf16 zmm22, zmm23, zmm24 +# ATT: vfmsub132bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfmsub132bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfmsub132bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfmsub132nepbf16 xmm22, xmm23, xmm24 +# ATT: vfmsub132bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfmsub132bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfmsub132nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfmsub132bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0x9a,0xf0 -# ATT: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0x9a,0xf0 -# ATT: vfmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, 
%zmm22 -# INTEL: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfmsub132bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0x9a,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0x9a,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0x9a,0x71,0x7f -# ATT: vfmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0x9a,0x72,0x80 -# ATT: vfmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub132bf16 268435456(%rbp,%r14,8), 
%ymm23, %ymm22 +# INTEL: vfmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfmsub132bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0x9a,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0x9a,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0x9a,0x71,0x7f -# ATT: vfmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0x9a,0x72,0x80 -# ATT: vfmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 
0x62,0xa6,0x44,0x00,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfmsub132bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0x9a,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0x9a,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0x9a,0x71,0x7f -# ATT: vfmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0x9a,0x72,0x80 -# ATT: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfmsub213nepbf16 ymm22, ymm23, ymm24 +# ATT: vfmsub213bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfmsub213bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfmsub213nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfmsub213bf16 ymm22 {k7}, ymm23, ymm24 
0x62,0x86,0x44,0x27,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfmsub213nepbf16 zmm22, zmm23, zmm24 +# ATT: vfmsub213bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfmsub213bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfmsub213bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfmsub213nepbf16 xmm22, xmm23, xmm24 +# ATT: vfmsub213bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfmsub213bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfmsub213bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xaa,0xf0 -# ATT: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xaa,0xf0 -# ATT: vfmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 
0x62,0xa6,0x44,0x40,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfmsub213bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xaa,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xaa,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xaa,0x71,0x7f -# ATT: vfmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xaa,0x72,0x80 -# ATT: vfmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: 
vfmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfmsub213bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xaa,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xaa,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xaa,0x71,0x7f -# ATT: vfmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xaa,0x72,0x80 -# ATT: vfmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# 
INTEL: vfmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfmsub213bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xaa,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0xaa,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xaa,0x71,0x7f -# ATT: vfmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0xaa,0x72,0x80 -# ATT: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfmsub231nepbf16 ymm22, ymm23, ymm24 +# ATT: vfmsub231bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfmsub231bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xba,0xf0 -# ATT: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfmsub231bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0xba,0xf0 -# ATT: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24 
0x62,0x86,0x44,0xa7,0xba,0xf0 -# ATT: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfmsub231nepbf16 zmm22, zmm23, zmm24 +# ATT: vfmsub231bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfmsub231bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xba,0xf0 -# ATT: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfmsub231bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0xba,0xf0 -# ATT: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xba,0xf0 -# ATT: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfmsub231nepbf16 xmm22, xmm23, xmm24 +# ATT: vfmsub231bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfmsub231bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0xba,0xf0 -# ATT: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfmsub231bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xba,0xf0 -# ATT: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xba,0xf0 -# ATT: vfmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfmsub231bf16 zmm22 
{k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xba,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfmsub231bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xba,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xba,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xba,0x71,0x7f -# ATT: vfmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xba,0x72,0x80 -# ATT: vfmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xba,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub231nepbf16 
(%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfmsub231bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xba,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xba,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xba,0x71,0x7f -# ATT: vfmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xba,0x72,0x80 -# ATT: vfmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xba,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfmsub231bf16 (%rip){1to8}, 
%xmm23, %xmm22 +# INTEL: vfmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xba,0x35,0x00,0x00,0x00,0x00 -# ATT: vfmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0xba,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xba,0x71,0x7f -# ATT: vfmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0xba,0x72,0x80 -# ATT: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfnmadd132nepbf16 ymm22, ymm23, ymm24 +# ATT: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfnmadd132bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfnmadd132bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfnmadd132nepbf16 zmm22, zmm23, zmm24 +# ATT: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfnmadd132bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 
%zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfnmadd132bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfnmadd132nepbf16 xmm22, xmm23, xmm24 +# ATT: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfnmadd132bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfnmadd132bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0x9c,0xf0 -# ATT: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfnmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfnmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfnmadd132bf16 
(%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfnmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0x9c,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfnmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0x9c,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfnmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0x9c,0x71,0x7f -# ATT: vfnmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfnmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0x9c,0x72,0x80 -# ATT: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfnmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfnmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfnmadd132bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfnmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16} 
0x62,0xe6,0x44,0x30,0x9c,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfnmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0x9c,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfnmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0x9c,0x71,0x7f -# ATT: vfnmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfnmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0x9c,0x72,0x80 -# ATT: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfnmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfnmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfnmadd132bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfnmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0x9c,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# 
INTEL: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfnmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0x9c,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfnmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0x9c,0x71,0x7f -# ATT: vfnmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfnmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0x9c,0x72,0x80 -# ATT: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfnmadd213nepbf16 ymm22, ymm23, ymm24 +# ATT: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfnmadd213bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfnmadd213bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfnmadd213nepbf16 zmm22, zmm23, zmm24 +# ATT: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfnmadd213bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfnmadd213bf16 zmm22 {k7}, 
zmm23, zmm24 0x62,0x86,0x44,0x47,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfnmadd213nepbf16 xmm22, xmm23, xmm24 +# ATT: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfnmadd213bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfnmadd213bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xac,0xf0 -# ATT: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xac,0xf0 -# ATT: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfnmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xac,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfnmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfnmadd213bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfnmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xac,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd213nepbf16 
-2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfnmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xac,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfnmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xac,0x71,0x7f -# ATT: vfnmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfnmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xac,0x72,0x80 -# ATT: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfnmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xac,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfnmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfnmadd213bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfnmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xac,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: 
vfnmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xac,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfnmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xac,0x71,0x7f -# ATT: vfnmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfnmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xac,0x72,0x80 -# ATT: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfnmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xac,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfnmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfnmadd213bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfnmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xac,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfnmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 
0x62,0xe6,0x44,0x00,0xac,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfnmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xac,0x71,0x7f -# ATT: vfnmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfnmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0xac,0x72,0x80 -# ATT: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfnmadd231nepbf16 ymm22, ymm23, ymm24 +# ATT: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfnmadd231bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfnmadd231bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfnmadd231nepbf16 zmm22, zmm23, zmm24 +# ATT: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfnmadd231bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfnmadd231bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfnmadd231bf16 
%zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfnmadd231nepbf16 xmm22, xmm23, xmm24 +# ATT: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfnmadd231bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfnmadd231bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xbc,0xf0 -# ATT: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfnmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfnmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfnmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfnmadd231bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfnmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xbc,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfnmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfnmadd231bf16 zmm22, 
zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xbc,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfnmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xbc,0x71,0x7f -# ATT: vfnmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfnmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xbc,0x72,0x80 -# ATT: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfnmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfnmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfnmadd231bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfnmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xbc,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfnmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xbc,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: 
vfnmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfnmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xbc,0x71,0x7f -# ATT: vfnmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfnmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xbc,0x72,0x80 -# ATT: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfnmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfnmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfnmadd231bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfnmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xbc,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfnmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0xbc,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword 
ptr [rcx + 2032] +# ATT: vfnmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xbc,0x71,0x7f -# ATT: vfnmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfnmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0xbc,0x72,0x80 -# ATT: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfnmsub132nepbf16 ymm22, ymm23, ymm24 +# ATT: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfnmsub132bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfnmsub132bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfnmsub132nepbf16 zmm22, zmm23, zmm24 +# ATT: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfnmsub132bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfnmsub132bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: 
vfnmsub132nepbf16 xmm22, xmm23, xmm24 +# ATT: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfnmsub132bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfnmsub132bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0x9e,0xf0 -# ATT: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfnmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfnmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfnmsub132bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfnmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0x9e,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfnmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0x9e,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: 
vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfnmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0x9e,0x71,0x7f -# ATT: vfnmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfnmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0x9e,0x72,0x80 -# ATT: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfnmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfnmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfnmsub132bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfnmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0x9e,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfnmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0x9e,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfnmsub132bf16 4064(%rcx), %ymm23, 
%ymm22 {%k7} {z} +# INTEL: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0x9e,0x71,0x7f -# ATT: vfnmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfnmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0x9e,0x72,0x80 -# ATT: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfnmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfnmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfnmsub132bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfnmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0x9e,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfnmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0x9e,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfnmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 
0x62,0xe6,0x44,0x87,0x9e,0x71,0x7f -# ATT: vfnmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfnmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0x9e,0x72,0x80 -# ATT: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfnmsub213nepbf16 ymm22, ymm23, ymm24 +# ATT: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfnmsub213bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfnmsub213bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfnmsub213nepbf16 zmm22, zmm23, zmm24 +# ATT: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfnmsub213bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfnmsub213bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfnmsub213nepbf16 xmm22, xmm23, xmm24 +# ATT: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfnmsub213bf16 xmm22, xmm23, xmm24 
0x62,0x86,0x44,0x00,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vfnmsub213bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xae,0xf0 -# ATT: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xae,0xf0 -# ATT: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfnmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xae,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfnmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfnmsub213bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfnmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xae,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfnmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xae,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfnmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: 
vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xae,0x71,0x7f -# ATT: vfnmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfnmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xae,0x72,0x80 -# ATT: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfnmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xae,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfnmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfnmsub213bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfnmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xae,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfnmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xae,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfnmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xae,0x71,0x7f -# ATT: 
vfnmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfnmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xae,0x72,0x80 -# ATT: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfnmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xae,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfnmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfnmsub213bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfnmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xae,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfnmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0xae,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfnmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xae,0x71,0x7f -# ATT: vfnmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, word 
ptr [rdx - 256]{1to8} +# ATT: vfnmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0xae,0x72,0x80 -# ATT: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vfnmsub231nepbf16 ymm22, ymm23, ymm24 +# ATT: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 +# INTEL: vfnmsub231bf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vfnmsub231bf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vfnmsub231nepbf16 zmm22, zmm23, zmm24 +# ATT: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 +# INTEL: vfnmsub231bf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vfnmsub231bf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vfnmsub231nepbf16 xmm22, xmm23, xmm24 +# ATT: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 +# INTEL: vfnmsub231bf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 
{%k7} +# INTEL: vfnmsub231bf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0xbe,0xf0 -# ATT: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vfnmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vfnmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vfnmsub231bf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vfnmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0xbe,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vfnmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0xbe,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vfnmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vfnmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0xbe,0x71,0x7f -# ATT: vfnmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: 
vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vfnmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0xbe,0x72,0x80 -# ATT: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vfnmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vfnmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vfnmsub231bf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vfnmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0xbe,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vfnmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0xbe,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vfnmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vfnmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0xbe,0x71,0x7f -# ATT: vfnmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vfnmsub231bf16 
-256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0xbe,0x72,0x80 -# ATT: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vfnmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vfnmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vfnmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vfnmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vfnmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vfnmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vfnmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vfnmsub231bf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vfnmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0xbe,0x35,0x00,0x00,0x00,0x00 -# ATT: vfnmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vfnmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vfnmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0xbe,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vfnmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vfnmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0xbe,0x71,0x7f -# ATT: vfnmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vfnmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 
0x62,0xe6,0x44,0x97,0xbe,0x72,0x80 -# ATT: vfpclasspbf16 $123, %zmm23, %k5 -# INTEL: vfpclasspbf16 k5, zmm23, 123 +# ATT: vfpclassbf16 $123, %zmm23, %k5 +# INTEL: vfpclassbf16 k5, zmm23, 123 0x62,0xb3,0x7f,0x48,0x66,0xef,0x7b -# ATT: vfpclasspbf16 $123, %zmm23, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, zmm23, 123 +# ATT: vfpclassbf16 $123, %zmm23, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, zmm23, 123 0x62,0xb3,0x7f,0x4f,0x66,0xef,0x7b -# ATT: vfpclasspbf16 $123, %ymm23, %k5 -# INTEL: vfpclasspbf16 k5, ymm23, 123 +# ATT: vfpclassbf16 $123, %ymm23, %k5 +# INTEL: vfpclassbf16 k5, ymm23, 123 0x62,0xb3,0x7f,0x28,0x66,0xef,0x7b -# ATT: vfpclasspbf16 $123, %ymm23, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, ymm23, 123 +# ATT: vfpclassbf16 $123, %ymm23, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, ymm23, 123 0x62,0xb3,0x7f,0x2f,0x66,0xef,0x7b -# ATT: vfpclasspbf16 $123, %xmm23, %k5 -# INTEL: vfpclasspbf16 k5, xmm23, 123 +# ATT: vfpclassbf16 $123, %xmm23, %k5 +# INTEL: vfpclassbf16 k5, xmm23, 123 0x62,0xb3,0x7f,0x08,0x66,0xef,0x7b -# ATT: vfpclasspbf16 $123, %xmm23, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, xmm23, 123 +# ATT: vfpclassbf16 $123, %xmm23, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, xmm23, 123 0x62,0xb3,0x7f,0x0f,0x66,0xef,0x7b -# ATT: vfpclasspbf16x $123, 268435456(%rbp,%r14,8), %k5 -# INTEL: vfpclasspbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vfpclassbf16x $123, 268435456(%rbp,%r14,8), %k5 +# INTEL: vfpclassbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xb3,0x7f,0x08,0x66,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vfpclasspbf16x $123, 291(%r8,%rax,4), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vfpclassbf16x $123, 291(%r8,%rax,4), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 0x62,0xd3,0x7f,0x0f,0x66,0xac,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vfpclasspbf16 $123, (%rip){1to8}, %k5 -# INTEL: vfpclasspbf16 k5, word ptr [rip]{1to8}, 123 +# ATT: vfpclassbf16 $123, 
(%rip){1to8}, %k5 +# INTEL: vfpclassbf16 k5, word ptr [rip]{1to8}, 123 0x62,0xf3,0x7f,0x18,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b -# ATT: vfpclasspbf16x $123, -512(,%rbp,2), %k5 -# INTEL: vfpclasspbf16 k5, xmmword ptr [2*rbp - 512], 123 +# ATT: vfpclassbf16x $123, -512(,%rbp,2), %k5 +# INTEL: vfpclassbf16 k5, xmmword ptr [2*rbp - 512], 123 0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vfpclasspbf16x $123, 2032(%rcx), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123 +# ATT: vfpclassbf16x $123, 2032(%rcx), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123 0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b -# ATT: vfpclasspbf16 $123, -256(%rdx){1to8}, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123 +# ATT: vfpclassbf16 $123, -256(%rdx){1to8}, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123 0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b -# ATT: vfpclasspbf16 $123, (%rip){1to16}, %k5 -# INTEL: vfpclasspbf16 k5, word ptr [rip]{1to16}, 123 +# ATT: vfpclassbf16 $123, (%rip){1to16}, %k5 +# INTEL: vfpclassbf16 k5, word ptr [rip]{1to16}, 123 0x62,0xf3,0x7f,0x38,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b -# ATT: vfpclasspbf16y $123, -1024(,%rbp,2), %k5 -# INTEL: vfpclasspbf16 k5, ymmword ptr [2*rbp - 1024], 123 +# ATT: vfpclassbf16y $123, -1024(,%rbp,2), %k5 +# INTEL: vfpclassbf16 k5, ymmword ptr [2*rbp - 1024], 123 0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vfpclasspbf16y $123, 4064(%rcx), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123 +# ATT: vfpclassbf16y $123, 4064(%rcx), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123 0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b -# ATT: vfpclasspbf16 $123, -256(%rdx){1to16}, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123 +# ATT: vfpclassbf16 $123, -256(%rdx){1to16}, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123 
0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b -# ATT: vfpclasspbf16 $123, (%rip){1to32}, %k5 -# INTEL: vfpclasspbf16 k5, word ptr [rip]{1to32}, 123 +# ATT: vfpclassbf16 $123, (%rip){1to32}, %k5 +# INTEL: vfpclassbf16 k5, word ptr [rip]{1to32}, 123 0x62,0xf3,0x7f,0x58,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b -# ATT: vfpclasspbf16z $123, -2048(,%rbp,2), %k5 -# INTEL: vfpclasspbf16 k5, zmmword ptr [2*rbp - 2048], 123 +# ATT: vfpclassbf16z $123, -2048(,%rbp,2), %k5 +# INTEL: vfpclassbf16 k5, zmmword ptr [2*rbp - 2048], 123 0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vfpclasspbf16z $123, 8128(%rcx), %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123 +# ATT: vfpclassbf16z $123, 8128(%rcx), %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123 0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b -# ATT: vfpclasspbf16 $123, -256(%rdx){1to32}, %k5 {%k7} -# INTEL: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123 +# ATT: vfpclassbf16 $123, -256(%rdx){1to32}, %k5 {%k7} +# INTEL: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123 0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b -# ATT: vgetexppbf16 %xmm23, %xmm22 -# INTEL: vgetexppbf16 xmm22, xmm23 +# ATT: vgetexpbf16 %xmm23, %xmm22 +# INTEL: vgetexpbf16 xmm22, xmm23 0x62,0xa5,0x7d,0x08,0x42,0xf7 -# ATT: vgetexppbf16 %xmm23, %xmm22 {%k7} -# INTEL: vgetexppbf16 xmm22 {k7}, xmm23 +# ATT: vgetexpbf16 %xmm23, %xmm22 {%k7} +# INTEL: vgetexpbf16 xmm22 {k7}, xmm23 0x62,0xa5,0x7d,0x0f,0x42,0xf7 -# ATT: vgetexppbf16 %xmm23, %xmm22 {%k7} {z} -# INTEL: vgetexppbf16 xmm22 {k7} {z}, xmm23 +# ATT: vgetexpbf16 %xmm23, %xmm22 {%k7} {z} +# INTEL: vgetexpbf16 xmm22 {k7} {z}, xmm23 0x62,0xa5,0x7d,0x8f,0x42,0xf7 -# ATT: vgetexppbf16 %zmm23, %zmm22 -# INTEL: vgetexppbf16 zmm22, zmm23 +# ATT: vgetexpbf16 %zmm23, %zmm22 +# INTEL: vgetexpbf16 zmm22, zmm23 0x62,0xa5,0x7d,0x48,0x42,0xf7 -# ATT: vgetexppbf16 %zmm23, %zmm22 {%k7} -# INTEL: vgetexppbf16 zmm22 {k7}, zmm23 +# ATT: vgetexpbf16 %zmm23, %zmm22 {%k7} +# 
INTEL: vgetexpbf16 zmm22 {k7}, zmm23 0x62,0xa5,0x7d,0x4f,0x42,0xf7 -# ATT: vgetexppbf16 %zmm23, %zmm22 {%k7} {z} -# INTEL: vgetexppbf16 zmm22 {k7} {z}, zmm23 +# ATT: vgetexpbf16 %zmm23, %zmm22 {%k7} {z} +# INTEL: vgetexpbf16 zmm22 {k7} {z}, zmm23 0x62,0xa5,0x7d,0xcf,0x42,0xf7 -# ATT: vgetexppbf16 %ymm23, %ymm22 -# INTEL: vgetexppbf16 ymm22, ymm23 +# ATT: vgetexpbf16 %ymm23, %ymm22 +# INTEL: vgetexpbf16 ymm22, ymm23 0x62,0xa5,0x7d,0x28,0x42,0xf7 -# ATT: vgetexppbf16 %ymm23, %ymm22 {%k7} -# INTEL: vgetexppbf16 ymm22 {k7}, ymm23 +# ATT: vgetexpbf16 %ymm23, %ymm22 {%k7} +# INTEL: vgetexpbf16 ymm22 {k7}, ymm23 0x62,0xa5,0x7d,0x2f,0x42,0xf7 -# ATT: vgetexppbf16 %ymm23, %ymm22 {%k7} {z} -# INTEL: vgetexppbf16 ymm22 {k7} {z}, ymm23 +# ATT: vgetexpbf16 %ymm23, %ymm22 {%k7} {z} +# INTEL: vgetexpbf16 ymm22 {k7} {z}, ymm23 0x62,0xa5,0x7d,0xaf,0x42,0xf7 -# ATT: vgetexppbf16 268435456(%rbp,%r14,8), %xmm22 -# INTEL: vgetexppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vgetexpbf16 268435456(%rbp,%r14,8), %xmm22 +# INTEL: vgetexpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x7d,0x08,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vgetexppbf16 291(%r8,%rax,4), %xmm22 {%k7} -# INTEL: vgetexppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] +# ATT: vgetexpbf16 291(%r8,%rax,4), %xmm22 {%k7} +# INTEL: vgetexpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x7d,0x0f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vgetexppbf16 (%rip){1to8}, %xmm22 -# INTEL: vgetexppbf16 xmm22, word ptr [rip]{1to8} +# ATT: vgetexpbf16 (%rip){1to8}, %xmm22 +# INTEL: vgetexpbf16 xmm22, word ptr [rip]{1to8} 0x62,0xe5,0x7d,0x18,0x42,0x35,0x00,0x00,0x00,0x00 -# ATT: vgetexppbf16 -512(,%rbp,2), %xmm22 -# INTEL: vgetexppbf16 xmm22, xmmword ptr [2*rbp - 512] +# ATT: vgetexpbf16 -512(,%rbp,2), %xmm22 +# INTEL: vgetexpbf16 xmm22, xmmword ptr [2*rbp - 512] 0x62,0xe5,0x7d,0x08,0x42,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vgetexppbf16 2032(%rcx), %xmm22 {%k7} {z} -# INTEL: vgetexppbf16 xmm22 
{k7} {z}, xmmword ptr [rcx + 2032] +# ATT: vgetexpbf16 2032(%rcx), %xmm22 {%k7} {z} +# INTEL: vgetexpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] 0x62,0xe5,0x7d,0x8f,0x42,0x71,0x7f -# ATT: vgetexppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -# INTEL: vgetexppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +# ATT: vgetexpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} +# INTEL: vgetexpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x7d,0x9f,0x42,0x72,0x80 -# ATT: vgetexppbf16 268435456(%rbp,%r14,8), %ymm22 -# INTEL: vgetexppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vgetexpbf16 268435456(%rbp,%r14,8), %ymm22 +# INTEL: vgetexpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x7d,0x28,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vgetexppbf16 291(%r8,%rax,4), %ymm22 {%k7} -# INTEL: vgetexppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +# ATT: vgetexpbf16 291(%r8,%rax,4), %ymm22 {%k7} +# INTEL: vgetexpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x7d,0x2f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vgetexppbf16 (%rip){1to16}, %ymm22 -# INTEL: vgetexppbf16 ymm22, word ptr [rip]{1to16} +# ATT: vgetexpbf16 (%rip){1to16}, %ymm22 +# INTEL: vgetexpbf16 ymm22, word ptr [rip]{1to16} 0x62,0xe5,0x7d,0x38,0x42,0x35,0x00,0x00,0x00,0x00 -# ATT: vgetexppbf16 -1024(,%rbp,2), %ymm22 -# INTEL: vgetexppbf16 ymm22, ymmword ptr [2*rbp - 1024] +# ATT: vgetexpbf16 -1024(,%rbp,2), %ymm22 +# INTEL: vgetexpbf16 ymm22, ymmword ptr [2*rbp - 1024] 0x62,0xe5,0x7d,0x28,0x42,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vgetexppbf16 4064(%rcx), %ymm22 {%k7} {z} -# INTEL: vgetexppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] +# ATT: vgetexpbf16 4064(%rcx), %ymm22 {%k7} {z} +# INTEL: vgetexpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] 0x62,0xe5,0x7d,0xaf,0x42,0x71,0x7f -# ATT: vgetexppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -# INTEL: vgetexppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +# ATT: vgetexpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +# INTEL: vgetexpbf16 
ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x7d,0xbf,0x42,0x72,0x80 -# ATT: vgetexppbf16 268435456(%rbp,%r14,8), %zmm22 -# INTEL: vgetexppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vgetexpbf16 268435456(%rbp,%r14,8), %zmm22 +# INTEL: vgetexpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x7d,0x48,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vgetexppbf16 291(%r8,%rax,4), %zmm22 {%k7} -# INTEL: vgetexppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +# ATT: vgetexpbf16 291(%r8,%rax,4), %zmm22 {%k7} +# INTEL: vgetexpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x7d,0x4f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vgetexppbf16 (%rip){1to32}, %zmm22 -# INTEL: vgetexppbf16 zmm22, word ptr [rip]{1to32} +# ATT: vgetexpbf16 (%rip){1to32}, %zmm22 +# INTEL: vgetexpbf16 zmm22, word ptr [rip]{1to32} 0x62,0xe5,0x7d,0x58,0x42,0x35,0x00,0x00,0x00,0x00 -# ATT: vgetexppbf16 -2048(,%rbp,2), %zmm22 -# INTEL: vgetexppbf16 zmm22, zmmword ptr [2*rbp - 2048] +# ATT: vgetexpbf16 -2048(,%rbp,2), %zmm22 +# INTEL: vgetexpbf16 zmm22, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x7d,0x48,0x42,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vgetexppbf16 8128(%rcx), %zmm22 {%k7} {z} -# INTEL: vgetexppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +# ATT: vgetexpbf16 8128(%rcx), %zmm22 {%k7} {z} +# INTEL: vgetexpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] 0x62,0xe5,0x7d,0xcf,0x42,0x71,0x7f -# ATT: vgetexppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} -# INTEL: vgetexppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} +# ATT: vgetexpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +# INTEL: vgetexpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} 0x62,0xe5,0x7d,0xdf,0x42,0x72,0x80 -# ATT: vgetmantpbf16 $123, %zmm23, %zmm22 -# INTEL: vgetmantpbf16 zmm22, zmm23, 123 +# ATT: vgetmantbf16 $123, %zmm23, %zmm22 +# INTEL: vgetmantbf16 zmm22, zmm23, 123 0x62,0xa3,0x7f,0x48,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} -# INTEL: vgetmantpbf16 zmm22 {k7}, zmm23, 123 +# 
ATT: vgetmantbf16 $123, %zmm23, %zmm22 {%k7} +# INTEL: vgetmantbf16 zmm22 {k7}, zmm23, 123 0x62,0xa3,0x7f,0x4f,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} {z} -# INTEL: vgetmantpbf16 zmm22 {k7} {z}, zmm23, 123 +# ATT: vgetmantbf16 $123, %zmm23, %zmm22 {%k7} {z} +# INTEL: vgetmantbf16 zmm22 {k7} {z}, zmm23, 123 0x62,0xa3,0x7f,0xcf,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %ymm23, %ymm22 -# INTEL: vgetmantpbf16 ymm22, ymm23, 123 +# ATT: vgetmantbf16 $123, %ymm23, %ymm22 +# INTEL: vgetmantbf16 ymm22, ymm23, 123 0x62,0xa3,0x7f,0x28,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} -# INTEL: vgetmantpbf16 ymm22 {k7}, ymm23, 123 +# ATT: vgetmantbf16 $123, %ymm23, %ymm22 {%k7} +# INTEL: vgetmantbf16 ymm22 {k7}, ymm23, 123 0x62,0xa3,0x7f,0x2f,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} {z} -# INTEL: vgetmantpbf16 ymm22 {k7} {z}, ymm23, 123 +# ATT: vgetmantbf16 $123, %ymm23, %ymm22 {%k7} {z} +# INTEL: vgetmantbf16 ymm22 {k7} {z}, ymm23, 123 0x62,0xa3,0x7f,0xaf,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %xmm23, %xmm22 -# INTEL: vgetmantpbf16 xmm22, xmm23, 123 +# ATT: vgetmantbf16 $123, %xmm23, %xmm22 +# INTEL: vgetmantbf16 xmm22, xmm23, 123 0x62,0xa3,0x7f,0x08,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} -# INTEL: vgetmantpbf16 xmm22 {k7}, xmm23, 123 +# ATT: vgetmantbf16 $123, %xmm23, %xmm22 {%k7} +# INTEL: vgetmantbf16 xmm22 {k7}, xmm23, 123 0x62,0xa3,0x7f,0x0f,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} {z} -# INTEL: vgetmantpbf16 xmm22 {k7} {z}, xmm23, 123 +# ATT: vgetmantbf16 $123, %xmm23, %xmm22 {%k7} {z} +# INTEL: vgetmantbf16 xmm22 {k7} {z}, xmm23, 123 0x62,0xa3,0x7f,0x8f,0x26,0xf7,0x7b -# ATT: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %xmm22 -# INTEL: vgetmantpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %xmm22 +# INTEL: vgetmantbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 
0x62,0xa3,0x7f,0x08,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vgetmantpbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} -# INTEL: vgetmantpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vgetmantbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} +# INTEL: vgetmantbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x0f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, (%rip){1to8}, %xmm22 -# INTEL: vgetmantpbf16 xmm22, word ptr [rip]{1to8}, 123 +# ATT: vgetmantbf16 $123, (%rip){1to8}, %xmm22 +# INTEL: vgetmantbf16 xmm22, word ptr [rip]{1to8}, 123 0x62,0xe3,0x7f,0x18,0x26,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, -512(,%rbp,2), %xmm22 -# INTEL: vgetmantpbf16 xmm22, xmmword ptr [2*rbp - 512], 123 +# ATT: vgetmantbf16 $123, -512(,%rbp,2), %xmm22 +# INTEL: vgetmantbf16 xmm22, xmmword ptr [2*rbp - 512], 123 0x62,0xe3,0x7f,0x08,0x26,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vgetmantpbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} -# INTEL: vgetmantpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 +# ATT: vgetmantbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} +# INTEL: vgetmantbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 0x62,0xe3,0x7f,0x8f,0x26,0x71,0x7f,0x7b -# ATT: vgetmantpbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} -# INTEL: vgetmantpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 +# ATT: vgetmantbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} +# INTEL: vgetmantbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 0x62,0xe3,0x7f,0x9f,0x26,0x72,0x80,0x7b -# ATT: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %ymm22 -# INTEL: vgetmantpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %ymm22 +# INTEL: vgetmantbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x28,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vgetmantpbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} -# INTEL: vgetmantpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 +# ATT: vgetmantbf16 
$123, 291(%r8,%rax,4), %ymm22 {%k7} +# INTEL: vgetmantbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x2f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, (%rip){1to16}, %ymm22 -# INTEL: vgetmantpbf16 ymm22, word ptr [rip]{1to16}, 123 +# ATT: vgetmantbf16 $123, (%rip){1to16}, %ymm22 +# INTEL: vgetmantbf16 ymm22, word ptr [rip]{1to16}, 123 0x62,0xe3,0x7f,0x38,0x26,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, -1024(,%rbp,2), %ymm22 -# INTEL: vgetmantpbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 +# ATT: vgetmantbf16 $123, -1024(,%rbp,2), %ymm22 +# INTEL: vgetmantbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 0x62,0xe3,0x7f,0x28,0x26,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vgetmantpbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} -# INTEL: vgetmantpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 +# ATT: vgetmantbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} +# INTEL: vgetmantbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 0x62,0xe3,0x7f,0xaf,0x26,0x71,0x7f,0x7b -# ATT: vgetmantpbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} -# INTEL: vgetmantpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 +# ATT: vgetmantbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} +# INTEL: vgetmantbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 0x62,0xe3,0x7f,0xbf,0x26,0x72,0x80,0x7b -# ATT: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %zmm22 -# INTEL: vgetmantpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %zmm22 +# INTEL: vgetmantbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x48,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vgetmantpbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} -# INTEL: vgetmantpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vgetmantbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} +# INTEL: vgetmantbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x4f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, 
(%rip){1to32}, %zmm22 -# INTEL: vgetmantpbf16 zmm22, word ptr [rip]{1to32}, 123 +# ATT: vgetmantbf16 $123, (%rip){1to32}, %zmm22 +# INTEL: vgetmantbf16 zmm22, word ptr [rip]{1to32}, 123 0x62,0xe3,0x7f,0x58,0x26,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vgetmantpbf16 $123, -2048(,%rbp,2), %zmm22 -# INTEL: vgetmantpbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 +# ATT: vgetmantbf16 $123, -2048(,%rbp,2), %zmm22 +# INTEL: vgetmantbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 0x62,0xe3,0x7f,0x48,0x26,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vgetmantpbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} -# INTEL: vgetmantpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 +# ATT: vgetmantbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} +# INTEL: vgetmantbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 0x62,0xe3,0x7f,0xcf,0x26,0x71,0x7f,0x7b -# ATT: vgetmantpbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} -# INTEL: vgetmantpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 +# ATT: vgetmantbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} +# INTEL: vgetmantbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 0x62,0xe3,0x7f,0xdf,0x26,0x72,0x80,0x7b -# ATT: vmaxpbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vmaxpbf16 ymm22, ymm23, ymm24 +# ATT: vmaxbf16 %ymm24, %ymm23, %ymm22 +# INTEL: vmaxbf16 ymm22, ymm23, ymm24 0x62,0x85,0x45,0x20,0x5f,0xf0 -# ATT: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vmaxpbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vmaxbf16 ymm22 {k7}, ymm23, ymm24 0x62,0x85,0x45,0x27,0x5f,0xf0 -# ATT: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vmaxpbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vmaxbf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x85,0x45,0xa7,0x5f,0xf0 -# ATT: vmaxpbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vmaxpbf16 zmm22, zmm23, zmm24 +# ATT: vmaxbf16 %zmm24, %zmm23, %zmm22 +# INTEL: vmaxbf16 zmm22, zmm23, zmm24 0x62,0x85,0x45,0x40,0x5f,0xf0 -# ATT: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} 
-# INTEL: vmaxpbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vmaxbf16 zmm22 {k7}, zmm23, zmm24 0x62,0x85,0x45,0x47,0x5f,0xf0 -# ATT: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vmaxbf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x85,0x45,0xc7,0x5f,0xf0 -# ATT: vmaxpbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vmaxpbf16 xmm22, xmm23, xmm24 +# ATT: vmaxbf16 %xmm24, %xmm23, %xmm22 +# INTEL: vmaxbf16 xmm22, xmm23, xmm24 0x62,0x85,0x45,0x00,0x5f,0xf0 -# ATT: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vmaxpbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vmaxbf16 xmm22 {k7}, xmm23, xmm24 0x62,0x85,0x45,0x07,0x5f,0xf0 -# ATT: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vmaxbf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x85,0x45,0x87,0x5f,0xf0 -# ATT: vmaxpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vmaxpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vmaxbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vmaxbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x40,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vmaxpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vmaxpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vmaxbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vmaxbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x47,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vmaxpbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vmaxpbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vmaxbf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vmaxbf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe5,0x45,0x50,0x5f,0x35,0x00,0x00,0x00,0x00 -# ATT: vmaxpbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vmaxpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 
2048] +# ATT: vmaxbf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vmaxbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x45,0x40,0x5f,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vmaxpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vmaxbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vmaxbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe5,0x45,0xc7,0x5f,0x71,0x7f -# ATT: vmaxpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vmaxpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vmaxbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vmaxbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe5,0x45,0xd7,0x5f,0x72,0x80 -# ATT: vmaxpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vmaxpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vmaxbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vmaxbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x20,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vmaxpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vmaxpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vmaxbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vmaxbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x27,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vmaxpbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vmaxpbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vmaxbf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vmaxbf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe5,0x45,0x30,0x5f,0x35,0x00,0x00,0x00,0x00 -# ATT: vmaxpbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vmaxpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vmaxbf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vmaxbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe5,0x45,0x20,0x5f,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vmaxpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vmaxpbf16 ymm22 {k7} {z}, ymm23, ymmword 
ptr [rcx + 4064] +# ATT: vmaxbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vmaxbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe5,0x45,0xa7,0x5f,0x71,0x7f -# ATT: vmaxpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vmaxpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vmaxbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vmaxbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x45,0xb7,0x5f,0x72,0x80 -# ATT: vmaxpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vmaxpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vmaxbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vmaxbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x00,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vmaxpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vmaxpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vmaxbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vmaxbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x07,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vmaxpbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vmaxpbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vmaxbf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vmaxbf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe5,0x45,0x10,0x5f,0x35,0x00,0x00,0x00,0x00 -# ATT: vmaxpbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vmaxpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vmaxbf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vmaxbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe5,0x45,0x00,0x5f,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vmaxpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vmaxbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vmaxbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe5,0x45,0x87,0x5f,0x71,0x7f -# ATT: vmaxpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vmaxpbf16 xmm22 {k7} {z}, xmm23, word 
ptr [rdx - 256]{1to8} +# ATT: vmaxbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vmaxbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x45,0x97,0x5f,0x72,0x80 -# ATT: vminpbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vminpbf16 ymm22, ymm23, ymm24 +# ATT: vminbf16 %ymm24, %ymm23, %ymm22 +# INTEL: vminbf16 ymm22, ymm23, ymm24 0x62,0x85,0x45,0x20,0x5d,0xf0 -# ATT: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vminpbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vminbf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vminbf16 ymm22 {k7}, ymm23, ymm24 0x62,0x85,0x45,0x27,0x5d,0xf0 -# ATT: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vminpbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vminbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vminbf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x85,0x45,0xa7,0x5d,0xf0 -# ATT: vminpbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vminpbf16 zmm22, zmm23, zmm24 +# ATT: vminbf16 %zmm24, %zmm23, %zmm22 +# INTEL: vminbf16 zmm22, zmm23, zmm24 0x62,0x85,0x45,0x40,0x5d,0xf0 -# ATT: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vminpbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vminbf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vminbf16 zmm22 {k7}, zmm23, zmm24 0x62,0x85,0x45,0x47,0x5d,0xf0 -# ATT: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vminpbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vminbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vminbf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x85,0x45,0xc7,0x5d,0xf0 -# ATT: vminpbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vminpbf16 xmm22, xmm23, xmm24 +# ATT: vminbf16 %xmm24, %xmm23, %xmm22 +# INTEL: vminbf16 xmm22, xmm23, xmm24 0x62,0x85,0x45,0x00,0x5d,0xf0 -# ATT: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vminpbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vminbf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vminbf16 xmm22 {k7}, xmm23, xmm24 0x62,0x85,0x45,0x07,0x5d,0xf0 -# ATT: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vminpbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vminbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} 
+# INTEL: vminbf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x85,0x45,0x87,0x5d,0xf0 -# ATT: vminpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vminpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vminbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vminbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x40,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vminpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vminpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vminbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vminbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x47,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vminpbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vminpbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vminbf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vminbf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe5,0x45,0x50,0x5d,0x35,0x00,0x00,0x00,0x00 -# ATT: vminpbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vminpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vminbf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vminbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x45,0x40,0x5d,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vminpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vminpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vminbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vminbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe5,0x45,0xc7,0x5d,0x71,0x7f -# ATT: vminpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vminpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vminbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vminbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe5,0x45,0xd7,0x5d,0x72,0x80 -# ATT: vminpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vminpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vminbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: 
vminbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x20,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vminpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vminpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vminbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vminbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x27,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vminpbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vminpbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vminbf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vminbf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe5,0x45,0x30,0x5d,0x35,0x00,0x00,0x00,0x00 -# ATT: vminpbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vminpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vminbf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vminbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe5,0x45,0x20,0x5d,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vminpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vminpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vminbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vminbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe5,0x45,0xa7,0x5d,0x71,0x7f -# ATT: vminpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vminpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vminbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vminbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x45,0xb7,0x5d,0x72,0x80 -# ATT: vminpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vminpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vminbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vminbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x00,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vminpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vminpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vminbf16 291(%r8,%rax,4), 
%xmm23, %xmm22 {%k7} +# INTEL: vminbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x07,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vminpbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vminpbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vminbf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vminbf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe5,0x45,0x10,0x5d,0x35,0x00,0x00,0x00,0x00 -# ATT: vminpbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vminpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vminbf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vminbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe5,0x45,0x00,0x5d,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vminpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vminpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vminbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vminbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe5,0x45,0x87,0x5d,0x71,0x7f -# ATT: vminpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vminpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vminbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vminbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x45,0x97,0x5d,0x72,0x80 -# ATT: vmulnepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vmulnepbf16 ymm22, ymm23, ymm24 +# ATT: vmulbf16 %ymm24, %ymm23, %ymm22 +# INTEL: vmulbf16 ymm22, ymm23, ymm24 0x62,0x85,0x45,0x20,0x59,0xf0 -# ATT: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vmulnepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vmulbf16 ymm22 {k7}, ymm23, ymm24 0x62,0x85,0x45,0x27,0x59,0xf0 -# ATT: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vmulbf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x85,0x45,0xa7,0x59,0xf0 -# ATT: vmulnepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vmulnepbf16 zmm22, zmm23, zmm24 +# ATT: vmulbf16 %zmm24, %zmm23, 
%zmm22 +# INTEL: vmulbf16 zmm22, zmm23, zmm24 0x62,0x85,0x45,0x40,0x59,0xf0 -# ATT: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vmulnepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vmulbf16 zmm22 {k7}, zmm23, zmm24 0x62,0x85,0x45,0x47,0x59,0xf0 -# ATT: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vmulbf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x85,0x45,0xc7,0x59,0xf0 -# ATT: vmulnepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vmulnepbf16 xmm22, xmm23, xmm24 +# ATT: vmulbf16 %xmm24, %xmm23, %xmm22 +# INTEL: vmulbf16 xmm22, xmm23, xmm24 0x62,0x85,0x45,0x00,0x59,0xf0 -# ATT: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vmulnepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vmulbf16 xmm22 {k7}, xmm23, xmm24 0x62,0x85,0x45,0x07,0x59,0xf0 -# ATT: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vmulbf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x85,0x45,0x87,0x59,0xf0 -# ATT: vmulnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vmulnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vmulbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vmulbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x40,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vmulnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vmulnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vmulbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vmulbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x47,0x59,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vmulnepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vmulnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vmulbf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vmulbf16 zmm22, zmm23, word ptr [rip]{1to32} 
0x62,0xe5,0x45,0x50,0x59,0x35,0x00,0x00,0x00,0x00 -# ATT: vmulnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vmulnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vmulbf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vmulbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x45,0x40,0x59,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vmulnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vmulbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vmulbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe5,0x45,0xc7,0x59,0x71,0x7f -# ATT: vmulnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vmulnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vmulbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vmulbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe5,0x45,0xd7,0x59,0x72,0x80 -# ATT: vmulnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vmulnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vmulbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vmulbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x20,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vmulnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vmulnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vmulbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vmulbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x27,0x59,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vmulnepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vmulnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vmulbf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vmulbf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe5,0x45,0x30,0x59,0x35,0x00,0x00,0x00,0x00 -# ATT: vmulnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vmulnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vmulbf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vmulbf16 ymm22, ymm23, ymmword 
ptr [2*rbp - 1024] 0x62,0xe5,0x45,0x20,0x59,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vmulnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vmulbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vmulbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe5,0x45,0xa7,0x59,0x71,0x7f -# ATT: vmulnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vmulnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vmulbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vmulbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x45,0xb7,0x59,0x72,0x80 -# ATT: vmulnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vmulnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vmulbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vmulbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x00,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vmulnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vmulnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vmulbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vmulbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x07,0x59,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vmulnepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vmulnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vmulbf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vmulbf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe5,0x45,0x10,0x59,0x35,0x00,0x00,0x00,0x00 -# ATT: vmulnepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vmulnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vmulbf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vmulbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe5,0x45,0x00,0x59,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vmulnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vmulbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# 
INTEL: vmulbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe5,0x45,0x87,0x59,0x71,0x7f -# ATT: vmulnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vmulnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vmulbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vmulbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x45,0x97,0x59,0x72,0x80 -# ATT: vrcppbf16 %xmm23, %xmm22 -# INTEL: vrcppbf16 xmm22, xmm23 +# ATT: vrcpbf16 %xmm23, %xmm22 +# INTEL: vrcpbf16 xmm22, xmm23 0x62,0xa6,0x7c,0x08,0x4c,0xf7 -# ATT: vrcppbf16 %xmm23, %xmm22 {%k7} -# INTEL: vrcppbf16 xmm22 {k7}, xmm23 +# ATT: vrcpbf16 %xmm23, %xmm22 {%k7} +# INTEL: vrcpbf16 xmm22 {k7}, xmm23 0x62,0xa6,0x7c,0x0f,0x4c,0xf7 -# ATT: vrcppbf16 %xmm23, %xmm22 {%k7} {z} -# INTEL: vrcppbf16 xmm22 {k7} {z}, xmm23 +# ATT: vrcpbf16 %xmm23, %xmm22 {%k7} {z} +# INTEL: vrcpbf16 xmm22 {k7} {z}, xmm23 0x62,0xa6,0x7c,0x8f,0x4c,0xf7 -# ATT: vrcppbf16 %zmm23, %zmm22 -# INTEL: vrcppbf16 zmm22, zmm23 +# ATT: vrcpbf16 %zmm23, %zmm22 +# INTEL: vrcpbf16 zmm22, zmm23 0x62,0xa6,0x7c,0x48,0x4c,0xf7 -# ATT: vrcppbf16 %zmm23, %zmm22 {%k7} -# INTEL: vrcppbf16 zmm22 {k7}, zmm23 +# ATT: vrcpbf16 %zmm23, %zmm22 {%k7} +# INTEL: vrcpbf16 zmm22 {k7}, zmm23 0x62,0xa6,0x7c,0x4f,0x4c,0xf7 -# ATT: vrcppbf16 %zmm23, %zmm22 {%k7} {z} -# INTEL: vrcppbf16 zmm22 {k7} {z}, zmm23 +# ATT: vrcpbf16 %zmm23, %zmm22 {%k7} {z} +# INTEL: vrcpbf16 zmm22 {k7} {z}, zmm23 0x62,0xa6,0x7c,0xcf,0x4c,0xf7 -# ATT: vrcppbf16 %ymm23, %ymm22 -# INTEL: vrcppbf16 ymm22, ymm23 +# ATT: vrcpbf16 %ymm23, %ymm22 +# INTEL: vrcpbf16 ymm22, ymm23 0x62,0xa6,0x7c,0x28,0x4c,0xf7 -# ATT: vrcppbf16 %ymm23, %ymm22 {%k7} -# INTEL: vrcppbf16 ymm22 {k7}, ymm23 +# ATT: vrcpbf16 %ymm23, %ymm22 {%k7} +# INTEL: vrcpbf16 ymm22 {k7}, ymm23 0x62,0xa6,0x7c,0x2f,0x4c,0xf7 -# ATT: vrcppbf16 %ymm23, %ymm22 {%k7} {z} -# INTEL: vrcppbf16 ymm22 {k7} {z}, ymm23 +# ATT: vrcpbf16 %ymm23, %ymm22 {%k7} {z} +# INTEL: vrcpbf16 ymm22 {k7} {z}, ymm23 
0x62,0xa6,0x7c,0xaf,0x4c,0xf7 -# ATT: vrcppbf16 268435456(%rbp,%r14,8), %xmm22 -# INTEL: vrcppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vrcpbf16 268435456(%rbp,%r14,8), %xmm22 +# INTEL: vrcpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x7c,0x08,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vrcppbf16 291(%r8,%rax,4), %xmm22 {%k7} -# INTEL: vrcppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] +# ATT: vrcpbf16 291(%r8,%rax,4), %xmm22 {%k7} +# INTEL: vrcpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x7c,0x0f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vrcppbf16 (%rip){1to8}, %xmm22 -# INTEL: vrcppbf16 xmm22, word ptr [rip]{1to8} +# ATT: vrcpbf16 (%rip){1to8}, %xmm22 +# INTEL: vrcpbf16 xmm22, word ptr [rip]{1to8} 0x62,0xe6,0x7c,0x18,0x4c,0x35,0x00,0x00,0x00,0x00 -# ATT: vrcppbf16 -512(,%rbp,2), %xmm22 -# INTEL: vrcppbf16 xmm22, xmmword ptr [2*rbp - 512] +# ATT: vrcpbf16 -512(,%rbp,2), %xmm22 +# INTEL: vrcpbf16 xmm22, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x7c,0x08,0x4c,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vrcppbf16 2032(%rcx), %xmm22 {%k7} {z} -# INTEL: vrcppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] +# ATT: vrcpbf16 2032(%rcx), %xmm22 {%k7} {z} +# INTEL: vrcpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] 0x62,0xe6,0x7c,0x8f,0x4c,0x71,0x7f -# ATT: vrcppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -# INTEL: vrcppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +# ATT: vrcpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} +# INTEL: vrcpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x7c,0x9f,0x4c,0x72,0x80 -# ATT: vrcppbf16 268435456(%rbp,%r14,8), %ymm22 -# INTEL: vrcppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vrcpbf16 268435456(%rbp,%r14,8), %ymm22 +# INTEL: vrcpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x7c,0x28,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vrcppbf16 291(%r8,%rax,4), %ymm22 {%k7} -# INTEL: vrcppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +# ATT: vrcpbf16 291(%r8,%rax,4), %ymm22 {%k7} 
+# INTEL: vrcpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x7c,0x2f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vrcppbf16 (%rip){1to16}, %ymm22 -# INTEL: vrcppbf16 ymm22, word ptr [rip]{1to16} +# ATT: vrcpbf16 (%rip){1to16}, %ymm22 +# INTEL: vrcpbf16 ymm22, word ptr [rip]{1to16} 0x62,0xe6,0x7c,0x38,0x4c,0x35,0x00,0x00,0x00,0x00 -# ATT: vrcppbf16 -1024(,%rbp,2), %ymm22 -# INTEL: vrcppbf16 ymm22, ymmword ptr [2*rbp - 1024] +# ATT: vrcpbf16 -1024(,%rbp,2), %ymm22 +# INTEL: vrcpbf16 ymm22, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x7c,0x28,0x4c,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vrcppbf16 4064(%rcx), %ymm22 {%k7} {z} -# INTEL: vrcppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] +# ATT: vrcpbf16 4064(%rcx), %ymm22 {%k7} {z} +# INTEL: vrcpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] 0x62,0xe6,0x7c,0xaf,0x4c,0x71,0x7f -# ATT: vrcppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -# INTEL: vrcppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +# ATT: vrcpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +# INTEL: vrcpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x7c,0xbf,0x4c,0x72,0x80 -# ATT: vrcppbf16 268435456(%rbp,%r14,8), %zmm22 -# INTEL: vrcppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vrcpbf16 268435456(%rbp,%r14,8), %zmm22 +# INTEL: vrcpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x7c,0x48,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vrcppbf16 291(%r8,%rax,4), %zmm22 {%k7} -# INTEL: vrcppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +# ATT: vrcpbf16 291(%r8,%rax,4), %zmm22 {%k7} +# INTEL: vrcpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x7c,0x4f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vrcppbf16 (%rip){1to32}, %zmm22 -# INTEL: vrcppbf16 zmm22, word ptr [rip]{1to32} +# ATT: vrcpbf16 (%rip){1to32}, %zmm22 +# INTEL: vrcpbf16 zmm22, word ptr [rip]{1to32} 0x62,0xe6,0x7c,0x58,0x4c,0x35,0x00,0x00,0x00,0x00 -# ATT: vrcppbf16 -2048(,%rbp,2), %zmm22 -# INTEL: vrcppbf16 zmm22, zmmword ptr [2*rbp - 2048] +# ATT: vrcpbf16 
-2048(,%rbp,2), %zmm22 +# INTEL: vrcpbf16 zmm22, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x7c,0x48,0x4c,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vrcppbf16 8128(%rcx), %zmm22 {%k7} {z} -# INTEL: vrcppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +# ATT: vrcpbf16 8128(%rcx), %zmm22 {%k7} {z} +# INTEL: vrcpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] 0x62,0xe6,0x7c,0xcf,0x4c,0x71,0x7f -# ATT: vrcppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} -# INTEL: vrcppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} +# ATT: vrcpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +# INTEL: vrcpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x7c,0xdf,0x4c,0x72,0x80 -# ATT: vreducenepbf16 $123, %zmm23, %zmm22 -# INTEL: vreducenepbf16 zmm22, zmm23, 123 +# ATT: vreducebf16 $123, %zmm23, %zmm22 +# INTEL: vreducebf16 zmm22, zmm23, 123 0x62,0xa3,0x7f,0x48,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, %zmm23, %zmm22 {%k7} -# INTEL: vreducenepbf16 zmm22 {k7}, zmm23, 123 +# ATT: vreducebf16 $123, %zmm23, %zmm22 {%k7} +# INTEL: vreducebf16 zmm22 {k7}, zmm23, 123 0x62,0xa3,0x7f,0x4f,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, %zmm23, %zmm22 {%k7} {z} -# INTEL: vreducenepbf16 zmm22 {k7} {z}, zmm23, 123 +# ATT: vreducebf16 $123, %zmm23, %zmm22 {%k7} {z} +# INTEL: vreducebf16 zmm22 {k7} {z}, zmm23, 123 0x62,0xa3,0x7f,0xcf,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, %ymm23, %ymm22 -# INTEL: vreducenepbf16 ymm22, ymm23, 123 +# ATT: vreducebf16 $123, %ymm23, %ymm22 +# INTEL: vreducebf16 ymm22, ymm23, 123 0x62,0xa3,0x7f,0x28,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, %ymm23, %ymm22 {%k7} -# INTEL: vreducenepbf16 ymm22 {k7}, ymm23, 123 +# ATT: vreducebf16 $123, %ymm23, %ymm22 {%k7} +# INTEL: vreducebf16 ymm22 {k7}, ymm23, 123 0x62,0xa3,0x7f,0x2f,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, %ymm23, %ymm22 {%k7} {z} -# INTEL: vreducenepbf16 ymm22 {k7} {z}, ymm23, 123 +# ATT: vreducebf16 $123, %ymm23, %ymm22 {%k7} {z} +# INTEL: vreducebf16 ymm22 {k7} {z}, ymm23, 123 0x62,0xa3,0x7f,0xaf,0x56,0xf7,0x7b -# ATT: 
vreducenepbf16 $123, %xmm23, %xmm22 -# INTEL: vreducenepbf16 xmm22, xmm23, 123 +# ATT: vreducebf16 $123, %xmm23, %xmm22 +# INTEL: vreducebf16 xmm22, xmm23, 123 0x62,0xa3,0x7f,0x08,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, %xmm23, %xmm22 {%k7} -# INTEL: vreducenepbf16 xmm22 {k7}, xmm23, 123 +# ATT: vreducebf16 $123, %xmm23, %xmm22 {%k7} +# INTEL: vreducebf16 xmm22 {k7}, xmm23, 123 0x62,0xa3,0x7f,0x0f,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, %xmm23, %xmm22 {%k7} {z} -# INTEL: vreducenepbf16 xmm22 {k7} {z}, xmm23, 123 +# ATT: vreducebf16 $123, %xmm23, %xmm22 {%k7} {z} +# INTEL: vreducebf16 xmm22 {k7} {z}, xmm23, 123 0x62,0xa3,0x7f,0x8f,0x56,0xf7,0x7b -# ATT: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22 -# INTEL: vreducenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vreducebf16 $123, 268435456(%rbp,%r14,8), %xmm22 +# INTEL: vreducebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x08,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vreducenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} -# INTEL: vreducenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vreducebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} +# INTEL: vreducebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x0f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, (%rip){1to8}, %xmm22 -# INTEL: vreducenepbf16 xmm22, word ptr [rip]{1to8}, 123 +# ATT: vreducebf16 $123, (%rip){1to8}, %xmm22 +# INTEL: vreducebf16 xmm22, word ptr [rip]{1to8}, 123 0x62,0xe3,0x7f,0x18,0x56,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, -512(,%rbp,2), %xmm22 -# INTEL: vreducenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123 +# ATT: vreducebf16 $123, -512(,%rbp,2), %xmm22 +# INTEL: vreducebf16 xmm22, xmmword ptr [2*rbp - 512], 123 0x62,0xe3,0x7f,0x08,0x56,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vreducenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} -# INTEL: vreducenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 +# ATT: vreducebf16 
$123, 2032(%rcx), %xmm22 {%k7} {z} +# INTEL: vreducebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 0x62,0xe3,0x7f,0x8f,0x56,0x71,0x7f,0x7b -# ATT: vreducenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} -# INTEL: vreducenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 +# ATT: vreducebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} +# INTEL: vreducebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 0x62,0xe3,0x7f,0x9f,0x56,0x72,0x80,0x7b -# ATT: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22 -# INTEL: vreducenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vreducebf16 $123, 268435456(%rbp,%r14,8), %ymm22 +# INTEL: vreducebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x28,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vreducenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} -# INTEL: vreducenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 +# ATT: vreducebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} +# INTEL: vreducebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x2f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, (%rip){1to16}, %ymm22 -# INTEL: vreducenepbf16 ymm22, word ptr [rip]{1to16}, 123 +# ATT: vreducebf16 $123, (%rip){1to16}, %ymm22 +# INTEL: vreducebf16 ymm22, word ptr [rip]{1to16}, 123 0x62,0xe3,0x7f,0x38,0x56,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, -1024(,%rbp,2), %ymm22 -# INTEL: vreducenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 +# ATT: vreducebf16 $123, -1024(,%rbp,2), %ymm22 +# INTEL: vreducebf16 ymm22, ymmword ptr [2*rbp - 1024], 123 0x62,0xe3,0x7f,0x28,0x56,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vreducenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} -# INTEL: vreducenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 +# ATT: vreducebf16 $123, 4064(%rcx), %ymm22 {%k7} {z} +# INTEL: vreducebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 0x62,0xe3,0x7f,0xaf,0x56,0x71,0x7f,0x7b -# ATT: vreducenepbf16 $123, -256(%rdx){1to16}, %ymm22 
{%k7} {z} -# INTEL: vreducenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 +# ATT: vreducebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} +# INTEL: vreducebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 0x62,0xe3,0x7f,0xbf,0x56,0x72,0x80,0x7b -# ATT: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22 -# INTEL: vreducenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vreducebf16 $123, 268435456(%rbp,%r14,8), %zmm22 +# INTEL: vreducebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x48,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vreducenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} -# INTEL: vreducenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vreducebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} +# INTEL: vreducebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x4f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, (%rip){1to32}, %zmm22 -# INTEL: vreducenepbf16 zmm22, word ptr [rip]{1to32}, 123 +# ATT: vreducebf16 $123, (%rip){1to32}, %zmm22 +# INTEL: vreducebf16 zmm22, word ptr [rip]{1to32}, 123 0x62,0xe3,0x7f,0x58,0x56,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vreducenepbf16 $123, -2048(,%rbp,2), %zmm22 -# INTEL: vreducenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 +# ATT: vreducebf16 $123, -2048(,%rbp,2), %zmm22 +# INTEL: vreducebf16 zmm22, zmmword ptr [2*rbp - 2048], 123 0x62,0xe3,0x7f,0x48,0x56,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vreducenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} -# INTEL: vreducenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 +# ATT: vreducebf16 $123, 8128(%rcx), %zmm22 {%k7} {z} +# INTEL: vreducebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 0x62,0xe3,0x7f,0xcf,0x56,0x71,0x7f,0x7b -# ATT: vreducenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} -# INTEL: vreducenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 +# ATT: vreducebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} +# INTEL: vreducebf16 zmm22 {k7} {z}, word ptr [rdx 
- 256]{1to32}, 123 0x62,0xe3,0x7f,0xdf,0x56,0x72,0x80,0x7b -# ATT: vrndscalenepbf16 $123, %zmm23, %zmm22 -# INTEL: vrndscalenepbf16 zmm22, zmm23, 123 +# ATT: vrndscalebf16 $123, %zmm23, %zmm22 +# INTEL: vrndscalebf16 zmm22, zmm23, 123 0x62,0xa3,0x7f,0x48,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} -# INTEL: vrndscalenepbf16 zmm22 {k7}, zmm23, 123 +# ATT: vrndscalebf16 $123, %zmm23, %zmm22 {%k7} +# INTEL: vrndscalebf16 zmm22 {k7}, zmm23, 123 0x62,0xa3,0x7f,0x4f,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} {z} -# INTEL: vrndscalenepbf16 zmm22 {k7} {z}, zmm23, 123 +# ATT: vrndscalebf16 $123, %zmm23, %zmm22 {%k7} {z} +# INTEL: vrndscalebf16 zmm22 {k7} {z}, zmm23, 123 0x62,0xa3,0x7f,0xcf,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %ymm23, %ymm22 -# INTEL: vrndscalenepbf16 ymm22, ymm23, 123 +# ATT: vrndscalebf16 $123, %ymm23, %ymm22 +# INTEL: vrndscalebf16 ymm22, ymm23, 123 0x62,0xa3,0x7f,0x28,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} -# INTEL: vrndscalenepbf16 ymm22 {k7}, ymm23, 123 +# ATT: vrndscalebf16 $123, %ymm23, %ymm22 {%k7} +# INTEL: vrndscalebf16 ymm22 {k7}, ymm23, 123 0x62,0xa3,0x7f,0x2f,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} {z} -# INTEL: vrndscalenepbf16 ymm22 {k7} {z}, ymm23, 123 +# ATT: vrndscalebf16 $123, %ymm23, %ymm22 {%k7} {z} +# INTEL: vrndscalebf16 ymm22 {k7} {z}, ymm23, 123 0x62,0xa3,0x7f,0xaf,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %xmm23, %xmm22 -# INTEL: vrndscalenepbf16 xmm22, xmm23, 123 +# ATT: vrndscalebf16 $123, %xmm23, %xmm22 +# INTEL: vrndscalebf16 xmm22, xmm23, 123 0x62,0xa3,0x7f,0x08,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} -# INTEL: vrndscalenepbf16 xmm22 {k7}, xmm23, 123 +# ATT: vrndscalebf16 $123, %xmm23, %xmm22 {%k7} +# INTEL: vrndscalebf16 xmm22 {k7}, xmm23, 123 0x62,0xa3,0x7f,0x0f,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} {z} -# INTEL: vrndscalenepbf16 xmm22 {k7} {z}, xmm23, 123 
+# ATT: vrndscalebf16 $123, %xmm23, %xmm22 {%k7} {z} +# INTEL: vrndscalebf16 xmm22 {k7} {z}, xmm23, 123 0x62,0xa3,0x7f,0x8f,0x08,0xf7,0x7b -# ATT: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22 -# INTEL: vrndscalenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %xmm22 +# INTEL: vrndscalebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x08,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vrndscalenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} -# INTEL: vrndscalenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vrndscalebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} +# INTEL: vrndscalebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x0f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, (%rip){1to8}, %xmm22 -# INTEL: vrndscalenepbf16 xmm22, word ptr [rip]{1to8}, 123 +# ATT: vrndscalebf16 $123, (%rip){1to8}, %xmm22 +# INTEL: vrndscalebf16 xmm22, word ptr [rip]{1to8}, 123 0x62,0xe3,0x7f,0x18,0x08,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, -512(,%rbp,2), %xmm22 -# INTEL: vrndscalenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123 +# ATT: vrndscalebf16 $123, -512(,%rbp,2), %xmm22 +# INTEL: vrndscalebf16 xmm22, xmmword ptr [2*rbp - 512], 123 0x62,0xe3,0x7f,0x08,0x08,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b -# ATT: vrndscalenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} -# INTEL: vrndscalenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 +# ATT: vrndscalebf16 $123, 2032(%rcx), %xmm22 {%k7} {z} +# INTEL: vrndscalebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 0x62,0xe3,0x7f,0x8f,0x08,0x71,0x7f,0x7b -# ATT: vrndscalenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} -# INTEL: vrndscalenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 +# ATT: vrndscalebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} +# INTEL: vrndscalebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 0x62,0xe3,0x7f,0x9f,0x08,0x72,0x80,0x7b -# ATT: 
vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22 -# INTEL: vrndscalenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %ymm22 +# INTEL: vrndscalebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x28,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vrndscalenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} -# INTEL: vrndscalenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 +# ATT: vrndscalebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} +# INTEL: vrndscalebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x2f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, (%rip){1to16}, %ymm22 -# INTEL: vrndscalenepbf16 ymm22, word ptr [rip]{1to16}, 123 +# ATT: vrndscalebf16 $123, (%rip){1to16}, %ymm22 +# INTEL: vrndscalebf16 ymm22, word ptr [rip]{1to16}, 123 0x62,0xe3,0x7f,0x38,0x08,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, -1024(,%rbp,2), %ymm22 -# INTEL: vrndscalenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 +# ATT: vrndscalebf16 $123, -1024(,%rbp,2), %ymm22 +# INTEL: vrndscalebf16 ymm22, ymmword ptr [2*rbp - 1024], 123 0x62,0xe3,0x7f,0x28,0x08,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b -# ATT: vrndscalenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} -# INTEL: vrndscalenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 +# ATT: vrndscalebf16 $123, 4064(%rcx), %ymm22 {%k7} {z} +# INTEL: vrndscalebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 0x62,0xe3,0x7f,0xaf,0x08,0x71,0x7f,0x7b -# ATT: vrndscalenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} -# INTEL: vrndscalenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 +# ATT: vrndscalebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} +# INTEL: vrndscalebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 0x62,0xe3,0x7f,0xbf,0x08,0x72,0x80,0x7b -# ATT: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22 -# INTEL: vrndscalenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 +# ATT: 
vrndscalebf16 $123, 268435456(%rbp,%r14,8), %zmm22 +# INTEL: vrndscalebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 0x62,0xa3,0x7f,0x48,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b -# ATT: vrndscalenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} -# INTEL: vrndscalenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 +# ATT: vrndscalebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} +# INTEL: vrndscalebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 0x62,0xc3,0x7f,0x4f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, (%rip){1to32}, %zmm22 -# INTEL: vrndscalenepbf16 zmm22, word ptr [rip]{1to32}, 123 +# ATT: vrndscalebf16 $123, (%rip){1to32}, %zmm22 +# INTEL: vrndscalebf16 zmm22, word ptr [rip]{1to32}, 123 0x62,0xe3,0x7f,0x58,0x08,0x35,0x00,0x00,0x00,0x00,0x7b -# ATT: vrndscalenepbf16 $123, -2048(,%rbp,2), %zmm22 -# INTEL: vrndscalenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 +# ATT: vrndscalebf16 $123, -2048(,%rbp,2), %zmm22 +# INTEL: vrndscalebf16 zmm22, zmmword ptr [2*rbp - 2048], 123 0x62,0xe3,0x7f,0x48,0x08,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b -# ATT: vrndscalenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} -# INTEL: vrndscalenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 +# ATT: vrndscalebf16 $123, 8128(%rcx), %zmm22 {%k7} {z} +# INTEL: vrndscalebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 0x62,0xe3,0x7f,0xcf,0x08,0x71,0x7f,0x7b -# ATT: vrndscalenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} -# INTEL: vrndscalenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 +# ATT: vrndscalebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} +# INTEL: vrndscalebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 0x62,0xe3,0x7f,0xdf,0x08,0x72,0x80,0x7b -# ATT: vrsqrtpbf16 %xmm23, %xmm22 -# INTEL: vrsqrtpbf16 xmm22, xmm23 +# ATT: vrsqrtbf16 %xmm23, %xmm22 +# INTEL: vrsqrtbf16 xmm22, xmm23 0x62,0xa6,0x7c,0x08,0x4e,0xf7 -# ATT: vrsqrtpbf16 %xmm23, %xmm22 {%k7} -# INTEL: vrsqrtpbf16 xmm22 {k7}, xmm23 +# ATT: vrsqrtbf16 %xmm23, %xmm22 {%k7} +# 
INTEL: vrsqrtbf16 xmm22 {k7}, xmm23 0x62,0xa6,0x7c,0x0f,0x4e,0xf7 -# ATT: vrsqrtpbf16 %xmm23, %xmm22 {%k7} {z} -# INTEL: vrsqrtpbf16 xmm22 {k7} {z}, xmm23 +# ATT: vrsqrtbf16 %xmm23, %xmm22 {%k7} {z} +# INTEL: vrsqrtbf16 xmm22 {k7} {z}, xmm23 0x62,0xa6,0x7c,0x8f,0x4e,0xf7 -# ATT: vrsqrtpbf16 %zmm23, %zmm22 -# INTEL: vrsqrtpbf16 zmm22, zmm23 +# ATT: vrsqrtbf16 %zmm23, %zmm22 +# INTEL: vrsqrtbf16 zmm22, zmm23 0x62,0xa6,0x7c,0x48,0x4e,0xf7 -# ATT: vrsqrtpbf16 %zmm23, %zmm22 {%k7} -# INTEL: vrsqrtpbf16 zmm22 {k7}, zmm23 +# ATT: vrsqrtbf16 %zmm23, %zmm22 {%k7} +# INTEL: vrsqrtbf16 zmm22 {k7}, zmm23 0x62,0xa6,0x7c,0x4f,0x4e,0xf7 -# ATT: vrsqrtpbf16 %zmm23, %zmm22 {%k7} {z} -# INTEL: vrsqrtpbf16 zmm22 {k7} {z}, zmm23 +# ATT: vrsqrtbf16 %zmm23, %zmm22 {%k7} {z} +# INTEL: vrsqrtbf16 zmm22 {k7} {z}, zmm23 0x62,0xa6,0x7c,0xcf,0x4e,0xf7 -# ATT: vrsqrtpbf16 %ymm23, %ymm22 -# INTEL: vrsqrtpbf16 ymm22, ymm23 +# ATT: vrsqrtbf16 %ymm23, %ymm22 +# INTEL: vrsqrtbf16 ymm22, ymm23 0x62,0xa6,0x7c,0x28,0x4e,0xf7 -# ATT: vrsqrtpbf16 %ymm23, %ymm22 {%k7} -# INTEL: vrsqrtpbf16 ymm22 {k7}, ymm23 +# ATT: vrsqrtbf16 %ymm23, %ymm22 {%k7} +# INTEL: vrsqrtbf16 ymm22 {k7}, ymm23 0x62,0xa6,0x7c,0x2f,0x4e,0xf7 -# ATT: vrsqrtpbf16 %ymm23, %ymm22 {%k7} {z} -# INTEL: vrsqrtpbf16 ymm22 {k7} {z}, ymm23 +# ATT: vrsqrtbf16 %ymm23, %ymm22 {%k7} {z} +# INTEL: vrsqrtbf16 ymm22 {k7} {z}, ymm23 0x62,0xa6,0x7c,0xaf,0x4e,0xf7 -# ATT: vrsqrtpbf16 268435456(%rbp,%r14,8), %xmm22 -# INTEL: vrsqrtpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vrsqrtbf16 268435456(%rbp,%r14,8), %xmm22 +# INTEL: vrsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x7c,0x08,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vrsqrtpbf16 291(%r8,%rax,4), %xmm22 {%k7} -# INTEL: vrsqrtpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] +# ATT: vrsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7} +# INTEL: vrsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x7c,0x0f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vrsqrtpbf16 
(%rip){1to8}, %xmm22 -# INTEL: vrsqrtpbf16 xmm22, word ptr [rip]{1to8} +# ATT: vrsqrtbf16 (%rip){1to8}, %xmm22 +# INTEL: vrsqrtbf16 xmm22, word ptr [rip]{1to8} 0x62,0xe6,0x7c,0x18,0x4e,0x35,0x00,0x00,0x00,0x00 -# ATT: vrsqrtpbf16 -512(,%rbp,2), %xmm22 -# INTEL: vrsqrtpbf16 xmm22, xmmword ptr [2*rbp - 512] +# ATT: vrsqrtbf16 -512(,%rbp,2), %xmm22 +# INTEL: vrsqrtbf16 xmm22, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x7c,0x08,0x4e,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vrsqrtpbf16 2032(%rcx), %xmm22 {%k7} {z} -# INTEL: vrsqrtpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] +# ATT: vrsqrtbf16 2032(%rcx), %xmm22 {%k7} {z} +# INTEL: vrsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] 0x62,0xe6,0x7c,0x8f,0x4e,0x71,0x7f -# ATT: vrsqrtpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -# INTEL: vrsqrtpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +# ATT: vrsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} +# INTEL: vrsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x7c,0x9f,0x4e,0x72,0x80 -# ATT: vrsqrtpbf16 268435456(%rbp,%r14,8), %ymm22 -# INTEL: vrsqrtpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vrsqrtbf16 268435456(%rbp,%r14,8), %ymm22 +# INTEL: vrsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x7c,0x28,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vrsqrtpbf16 291(%r8,%rax,4), %ymm22 {%k7} -# INTEL: vrsqrtpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +# ATT: vrsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7} +# INTEL: vrsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x7c,0x2f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vrsqrtpbf16 (%rip){1to16}, %ymm22 -# INTEL: vrsqrtpbf16 ymm22, word ptr [rip]{1to16} +# ATT: vrsqrtbf16 (%rip){1to16}, %ymm22 +# INTEL: vrsqrtbf16 ymm22, word ptr [rip]{1to16} 0x62,0xe6,0x7c,0x38,0x4e,0x35,0x00,0x00,0x00,0x00 -# ATT: vrsqrtpbf16 -1024(,%rbp,2), %ymm22 -# INTEL: vrsqrtpbf16 ymm22, ymmword ptr [2*rbp - 1024] +# ATT: vrsqrtbf16 -1024(,%rbp,2), %ymm22 +# INTEL: vrsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024] 
0x62,0xe6,0x7c,0x28,0x4e,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vrsqrtpbf16 4064(%rcx), %ymm22 {%k7} {z} -# INTEL: vrsqrtpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] +# ATT: vrsqrtbf16 4064(%rcx), %ymm22 {%k7} {z} +# INTEL: vrsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] 0x62,0xe6,0x7c,0xaf,0x4e,0x71,0x7f -# ATT: vrsqrtpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -# INTEL: vrsqrtpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +# ATT: vrsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +# INTEL: vrsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x7c,0xbf,0x4e,0x72,0x80 -# ATT: vrsqrtpbf16 268435456(%rbp,%r14,8), %zmm22 -# INTEL: vrsqrtpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vrsqrtbf16 268435456(%rbp,%r14,8), %zmm22 +# INTEL: vrsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x7c,0x48,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vrsqrtpbf16 291(%r8,%rax,4), %zmm22 {%k7} -# INTEL: vrsqrtpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +# ATT: vrsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7} +# INTEL: vrsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x7c,0x4f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vrsqrtpbf16 (%rip){1to32}, %zmm22 -# INTEL: vrsqrtpbf16 zmm22, word ptr [rip]{1to32} +# ATT: vrsqrtbf16 (%rip){1to32}, %zmm22 +# INTEL: vrsqrtbf16 zmm22, word ptr [rip]{1to32} 0x62,0xe6,0x7c,0x58,0x4e,0x35,0x00,0x00,0x00,0x00 -# ATT: vrsqrtpbf16 -2048(,%rbp,2), %zmm22 -# INTEL: vrsqrtpbf16 zmm22, zmmword ptr [2*rbp - 2048] +# ATT: vrsqrtbf16 -2048(,%rbp,2), %zmm22 +# INTEL: vrsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x7c,0x48,0x4e,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vrsqrtpbf16 8128(%rcx), %zmm22 {%k7} {z} -# INTEL: vrsqrtpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +# ATT: vrsqrtbf16 8128(%rcx), %zmm22 {%k7} {z} +# INTEL: vrsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] 0x62,0xe6,0x7c,0xcf,0x4e,0x71,0x7f -# ATT: vrsqrtpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} -# INTEL: vrsqrtpbf16 zmm22 {k7} {z}, 
word ptr [rdx - 256]{1to32} +# ATT: vrsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +# INTEL: vrsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x7c,0xdf,0x4e,0x72,0x80 -# ATT: vscalefpbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vscalefpbf16 ymm22, ymm23, ymm24 +# ATT: vscalefbf16 %ymm24, %ymm23, %ymm22 +# INTEL: vscalefbf16 ymm22, ymm23, ymm24 0x62,0x86,0x44,0x20,0x2c,0xf0 -# ATT: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vscalefpbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vscalefbf16 ymm22 {k7}, ymm23, ymm24 0x62,0x86,0x44,0x27,0x2c,0xf0 -# ATT: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vscalefbf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x86,0x44,0xa7,0x2c,0xf0 -# ATT: vscalefpbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vscalefpbf16 zmm22, zmm23, zmm24 +# ATT: vscalefbf16 %zmm24, %zmm23, %zmm22 +# INTEL: vscalefbf16 zmm22, zmm23, zmm24 0x62,0x86,0x44,0x40,0x2c,0xf0 -# ATT: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vscalefpbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vscalefbf16 zmm22 {k7}, zmm23, zmm24 0x62,0x86,0x44,0x47,0x2c,0xf0 -# ATT: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vscalefbf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x86,0x44,0xc7,0x2c,0xf0 -# ATT: vscalefpbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vscalefpbf16 xmm22, xmm23, xmm24 +# ATT: vscalefbf16 %xmm24, %xmm23, %xmm22 +# INTEL: vscalefbf16 xmm22, xmm23, xmm24 0x62,0x86,0x44,0x00,0x2c,0xf0 -# ATT: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vscalefpbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vscalefbf16 xmm22 {k7}, xmm23, xmm24 0x62,0x86,0x44,0x07,0x2c,0xf0 -# ATT: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# 
INTEL: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vscalefbf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x86,0x44,0x87,0x2c,0xf0 -# ATT: vscalefpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vscalefpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vscalefbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vscalefbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x40,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vscalefpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vscalefpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vscalefbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vscalefbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x47,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vscalefpbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vscalefpbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vscalefbf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vscalefbf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe6,0x44,0x50,0x2c,0x35,0x00,0x00,0x00,0x00 -# ATT: vscalefpbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vscalefpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vscalefbf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vscalefbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe6,0x44,0x40,0x2c,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vscalefpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vscalefbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vscalefbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe6,0x44,0xc7,0x2c,0x71,0x7f -# ATT: vscalefpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vscalefpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vscalefbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vscalefbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe6,0x44,0xd7,0x2c,0x72,0x80 -# ATT: vscalefpbf16 
268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vscalefpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vscalefbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vscalefbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x20,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vscalefpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vscalefpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vscalefbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vscalefbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x27,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vscalefpbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vscalefpbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vscalefbf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vscalefbf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe6,0x44,0x30,0x2c,0x35,0x00,0x00,0x00,0x00 -# ATT: vscalefpbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vscalefpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vscalefbf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vscalefbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe6,0x44,0x20,0x2c,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vscalefpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vscalefbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vscalefbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe6,0x44,0xa7,0x2c,0x71,0x7f -# ATT: vscalefpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vscalefpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vscalefbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vscalefbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe6,0x44,0xb7,0x2c,0x72,0x80 -# ATT: vscalefpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vscalefpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vscalefbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vscalefbf16 xmm22, 
xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa6,0x44,0x00,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vscalefpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vscalefpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vscalefbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: vscalefbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc6,0x44,0x07,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vscalefpbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vscalefpbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vscalefbf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vscalefbf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe6,0x44,0x10,0x2c,0x35,0x00,0x00,0x00,0x00 -# ATT: vscalefpbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vscalefpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vscalefbf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vscalefbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe6,0x44,0x00,0x2c,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vscalefpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vscalefbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vscalefbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe6,0x44,0x87,0x2c,0x71,0x7f -# ATT: vscalefpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vscalefpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vscalefbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vscalefbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe6,0x44,0x97,0x2c,0x72,0x80 -# ATT: vsqrtnepbf16 %xmm23, %xmm22 -# INTEL: vsqrtnepbf16 xmm22, xmm23 +# ATT: vsqrtbf16 %xmm23, %xmm22 +# INTEL: vsqrtbf16 xmm22, xmm23 0x62,0xa5,0x7d,0x08,0x51,0xf7 -# ATT: vsqrtnepbf16 %xmm23, %xmm22 {%k7} -# INTEL: vsqrtnepbf16 xmm22 {k7}, xmm23 +# ATT: vsqrtbf16 %xmm23, %xmm22 {%k7} +# INTEL: vsqrtbf16 xmm22 {k7}, xmm23 0x62,0xa5,0x7d,0x0f,0x51,0xf7 -# ATT: vsqrtnepbf16 %xmm23, %xmm22 {%k7} {z} -# INTEL: vsqrtnepbf16 xmm22 {k7} 
{z}, xmm23 +# ATT: vsqrtbf16 %xmm23, %xmm22 {%k7} {z} +# INTEL: vsqrtbf16 xmm22 {k7} {z}, xmm23 0x62,0xa5,0x7d,0x8f,0x51,0xf7 -# ATT: vsqrtnepbf16 %zmm23, %zmm22 -# INTEL: vsqrtnepbf16 zmm22, zmm23 +# ATT: vsqrtbf16 %zmm23, %zmm22 +# INTEL: vsqrtbf16 zmm22, zmm23 0x62,0xa5,0x7d,0x48,0x51,0xf7 -# ATT: vsqrtnepbf16 %zmm23, %zmm22 {%k7} -# INTEL: vsqrtnepbf16 zmm22 {k7}, zmm23 +# ATT: vsqrtbf16 %zmm23, %zmm22 {%k7} +# INTEL: vsqrtbf16 zmm22 {k7}, zmm23 0x62,0xa5,0x7d,0x4f,0x51,0xf7 -# ATT: vsqrtnepbf16 %zmm23, %zmm22 {%k7} {z} -# INTEL: vsqrtnepbf16 zmm22 {k7} {z}, zmm23 +# ATT: vsqrtbf16 %zmm23, %zmm22 {%k7} {z} +# INTEL: vsqrtbf16 zmm22 {k7} {z}, zmm23 0x62,0xa5,0x7d,0xcf,0x51,0xf7 -# ATT: vsqrtnepbf16 %ymm23, %ymm22 -# INTEL: vsqrtnepbf16 ymm22, ymm23 +# ATT: vsqrtbf16 %ymm23, %ymm22 +# INTEL: vsqrtbf16 ymm22, ymm23 0x62,0xa5,0x7d,0x28,0x51,0xf7 -# ATT: vsqrtnepbf16 %ymm23, %ymm22 {%k7} -# INTEL: vsqrtnepbf16 ymm22 {k7}, ymm23 +# ATT: vsqrtbf16 %ymm23, %ymm22 {%k7} +# INTEL: vsqrtbf16 ymm22 {k7}, ymm23 0x62,0xa5,0x7d,0x2f,0x51,0xf7 -# ATT: vsqrtnepbf16 %ymm23, %ymm22 {%k7} {z} -# INTEL: vsqrtnepbf16 ymm22 {k7} {z}, ymm23 +# ATT: vsqrtbf16 %ymm23, %ymm22 {%k7} {z} +# INTEL: vsqrtbf16 ymm22 {k7} {z}, ymm23 0x62,0xa5,0x7d,0xaf,0x51,0xf7 -# ATT: vsqrtnepbf16 268435456(%rbp,%r14,8), %xmm22 -# INTEL: vsqrtnepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vsqrtbf16 268435456(%rbp,%r14,8), %xmm22 +# INTEL: vsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x7d,0x08,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vsqrtnepbf16 291(%r8,%rax,4), %xmm22 {%k7} -# INTEL: vsqrtnepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] +# ATT: vsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7} +# INTEL: vsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x7d,0x0f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vsqrtnepbf16 (%rip){1to8}, %xmm22 -# INTEL: vsqrtnepbf16 xmm22, word ptr [rip]{1to8} +# ATT: vsqrtbf16 (%rip){1to8}, %xmm22 +# INTEL: vsqrtbf16 xmm22, word ptr 
[rip]{1to8} 0x62,0xe5,0x7d,0x18,0x51,0x35,0x00,0x00,0x00,0x00 -# ATT: vsqrtnepbf16 -512(,%rbp,2), %xmm22 -# INTEL: vsqrtnepbf16 xmm22, xmmword ptr [2*rbp - 512] +# ATT: vsqrtbf16 -512(,%rbp,2), %xmm22 +# INTEL: vsqrtbf16 xmm22, xmmword ptr [2*rbp - 512] 0x62,0xe5,0x7d,0x08,0x51,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vsqrtnepbf16 2032(%rcx), %xmm22 {%k7} {z} -# INTEL: vsqrtnepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] +# ATT: vsqrtbf16 2032(%rcx), %xmm22 {%k7} {z} +# INTEL: vsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] 0x62,0xe5,0x7d,0x8f,0x51,0x71,0x7f -# ATT: vsqrtnepbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -# INTEL: vsqrtnepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +# ATT: vsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} +# INTEL: vsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x7d,0x9f,0x51,0x72,0x80 -# ATT: vsqrtnepbf16 268435456(%rbp,%r14,8), %ymm22 -# INTEL: vsqrtnepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vsqrtbf16 268435456(%rbp,%r14,8), %ymm22 +# INTEL: vsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x7d,0x28,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vsqrtnepbf16 291(%r8,%rax,4), %ymm22 {%k7} -# INTEL: vsqrtnepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +# ATT: vsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7} +# INTEL: vsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x7d,0x2f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vsqrtnepbf16 (%rip){1to16}, %ymm22 -# INTEL: vsqrtnepbf16 ymm22, word ptr [rip]{1to16} +# ATT: vsqrtbf16 (%rip){1to16}, %ymm22 +# INTEL: vsqrtbf16 ymm22, word ptr [rip]{1to16} 0x62,0xe5,0x7d,0x38,0x51,0x35,0x00,0x00,0x00,0x00 -# ATT: vsqrtnepbf16 -1024(,%rbp,2), %ymm22 -# INTEL: vsqrtnepbf16 ymm22, ymmword ptr [2*rbp - 1024] +# ATT: vsqrtbf16 -1024(,%rbp,2), %ymm22 +# INTEL: vsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024] 0x62,0xe5,0x7d,0x28,0x51,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vsqrtnepbf16 4064(%rcx), %ymm22 {%k7} {z} -# INTEL: vsqrtnepbf16 ymm22 {k7} {z}, ymmword ptr 
[rcx + 4064] +# ATT: vsqrtbf16 4064(%rcx), %ymm22 {%k7} {z} +# INTEL: vsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] 0x62,0xe5,0x7d,0xaf,0x51,0x71,0x7f -# ATT: vsqrtnepbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -# INTEL: vsqrtnepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +# ATT: vsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +# INTEL: vsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x7d,0xbf,0x51,0x72,0x80 -# ATT: vsqrtnepbf16 268435456(%rbp,%r14,8), %zmm22 -# INTEL: vsqrtnepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vsqrtbf16 268435456(%rbp,%r14,8), %zmm22 +# INTEL: vsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x7d,0x48,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vsqrtnepbf16 291(%r8,%rax,4), %zmm22 {%k7} -# INTEL: vsqrtnepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +# ATT: vsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7} +# INTEL: vsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x7d,0x4f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vsqrtnepbf16 (%rip){1to32}, %zmm22 -# INTEL: vsqrtnepbf16 zmm22, word ptr [rip]{1to32} +# ATT: vsqrtbf16 (%rip){1to32}, %zmm22 +# INTEL: vsqrtbf16 zmm22, word ptr [rip]{1to32} 0x62,0xe5,0x7d,0x58,0x51,0x35,0x00,0x00,0x00,0x00 -# ATT: vsqrtnepbf16 -2048(,%rbp,2), %zmm22 -# INTEL: vsqrtnepbf16 zmm22, zmmword ptr [2*rbp - 2048] +# ATT: vsqrtbf16 -2048(,%rbp,2), %zmm22 +# INTEL: vsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x7d,0x48,0x51,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vsqrtnepbf16 8128(%rcx), %zmm22 {%k7} {z} -# INTEL: vsqrtnepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +# ATT: vsqrtbf16 8128(%rcx), %zmm22 {%k7} {z} +# INTEL: vsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] 0x62,0xe5,0x7d,0xcf,0x51,0x71,0x7f -# ATT: vsqrtnepbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} -# INTEL: vsqrtnepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} +# ATT: vsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +# INTEL: vsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} 
0x62,0xe5,0x7d,0xdf,0x51,0x72,0x80 -# ATT: vsubnepbf16 %ymm24, %ymm23, %ymm22 -# INTEL: vsubnepbf16 ymm22, ymm23, ymm24 +# ATT: vsubbf16 %ymm24, %ymm23, %ymm22 +# INTEL: vsubbf16 ymm22, ymm23, ymm24 0x62,0x85,0x45,0x20,0x5c,0xf0 -# ATT: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} -# INTEL: vsubnepbf16 ymm22 {k7}, ymm23, ymm24 +# ATT: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} +# INTEL: vsubbf16 ymm22 {k7}, ymm23, ymm24 0x62,0x85,0x45,0x27,0x5c,0xf0 -# ATT: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -# INTEL: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +# ATT: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +# INTEL: vsubbf16 ymm22 {k7} {z}, ymm23, ymm24 0x62,0x85,0x45,0xa7,0x5c,0xf0 -# ATT: vsubnepbf16 %zmm24, %zmm23, %zmm22 -# INTEL: vsubnepbf16 zmm22, zmm23, zmm24 +# ATT: vsubbf16 %zmm24, %zmm23, %zmm22 +# INTEL: vsubbf16 zmm22, zmm23, zmm24 0x62,0x85,0x45,0x40,0x5c,0xf0 -# ATT: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} -# INTEL: vsubnepbf16 zmm22 {k7}, zmm23, zmm24 +# ATT: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} +# INTEL: vsubbf16 zmm22 {k7}, zmm23, zmm24 0x62,0x85,0x45,0x47,0x5c,0xf0 -# ATT: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -# INTEL: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +# ATT: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +# INTEL: vsubbf16 zmm22 {k7} {z}, zmm23, zmm24 0x62,0x85,0x45,0xc7,0x5c,0xf0 -# ATT: vsubnepbf16 %xmm24, %xmm23, %xmm22 -# INTEL: vsubnepbf16 xmm22, xmm23, xmm24 +# ATT: vsubbf16 %xmm24, %xmm23, %xmm22 +# INTEL: vsubbf16 xmm22, xmm23, xmm24 0x62,0x85,0x45,0x00,0x5c,0xf0 -# ATT: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} -# INTEL: vsubnepbf16 xmm22 {k7}, xmm23, xmm24 +# ATT: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} +# INTEL: vsubbf16 xmm22 {k7}, xmm23, xmm24 0x62,0x85,0x45,0x07,0x5c,0xf0 -# ATT: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -# INTEL: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +# ATT: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +# INTEL: vsubbf16 xmm22 {k7} {z}, xmm23, xmm24 0x62,0x85,0x45,0x87,0x5c,0xf0 -# ATT: vsubnepbf16 
268435456(%rbp,%r14,8), %zmm23, %zmm22 -# INTEL: vsubnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vsubbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +# INTEL: vsubbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x40,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vsubnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -# INTEL: vsubnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +# ATT: vsubbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +# INTEL: vsubbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x47,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vsubnepbf16 (%rip){1to32}, %zmm23, %zmm22 -# INTEL: vsubnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +# ATT: vsubbf16 (%rip){1to32}, %zmm23, %zmm22 +# INTEL: vsubbf16 zmm22, zmm23, word ptr [rip]{1to32} 0x62,0xe5,0x45,0x50,0x5c,0x35,0x00,0x00,0x00,0x00 -# ATT: vsubnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 -# INTEL: vsubnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +# ATT: vsubbf16 -2048(,%rbp,2), %zmm23, %zmm22 +# INTEL: vsubbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] 0x62,0xe5,0x45,0x40,0x5c,0x34,0x6d,0x00,0xf8,0xff,0xff -# ATT: vsubnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -# INTEL: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +# ATT: vsubbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +# INTEL: vsubbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] 0x62,0xe5,0x45,0xc7,0x5c,0x71,0x7f -# ATT: vsubnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -# INTEL: vsubnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +# ATT: vsubbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +# INTEL: vsubbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 0x62,0xe5,0x45,0xd7,0x5c,0x72,0x80 -# ATT: vsubnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -# INTEL: vsubnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +# ATT: vsubbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +# INTEL: vsubbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] 
0x62,0xa5,0x45,0x20,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vsubnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -# INTEL: vsubnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +# ATT: vsubbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +# INTEL: vsubbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x27,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vsubnepbf16 (%rip){1to16}, %ymm23, %ymm22 -# INTEL: vsubnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +# ATT: vsubbf16 (%rip){1to16}, %ymm23, %ymm22 +# INTEL: vsubbf16 ymm22, ymm23, word ptr [rip]{1to16} 0x62,0xe5,0x45,0x30,0x5c,0x35,0x00,0x00,0x00,0x00 -# ATT: vsubnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 -# INTEL: vsubnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +# ATT: vsubbf16 -1024(,%rbp,2), %ymm23, %ymm22 +# INTEL: vsubbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] 0x62,0xe5,0x45,0x20,0x5c,0x34,0x6d,0x00,0xfc,0xff,0xff -# ATT: vsubnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -# INTEL: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +# ATT: vsubbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +# INTEL: vsubbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 0x62,0xe5,0x45,0xa7,0x5c,0x71,0x7f -# ATT: vsubnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -# INTEL: vsubnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +# ATT: vsubbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +# INTEL: vsubbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} 0x62,0xe5,0x45,0xb7,0x5c,0x72,0x80 -# ATT: vsubnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -# INTEL: vsubnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +# ATT: vsubbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +# INTEL: vsubbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] 0x62,0xa5,0x45,0x00,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10 -# ATT: vsubnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -# INTEL: vsubnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +# ATT: vsubbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +# INTEL: 
vsubbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 0x62,0xc5,0x45,0x07,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00 -# ATT: vsubnepbf16 (%rip){1to8}, %xmm23, %xmm22 -# INTEL: vsubnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +# ATT: vsubbf16 (%rip){1to8}, %xmm23, %xmm22 +# INTEL: vsubbf16 xmm22, xmm23, word ptr [rip]{1to8} 0x62,0xe5,0x45,0x10,0x5c,0x35,0x00,0x00,0x00,0x00 -# ATT: vsubnepbf16 -512(,%rbp,2), %xmm23, %xmm22 -# INTEL: vsubnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +# ATT: vsubbf16 -512(,%rbp,2), %xmm23, %xmm22 +# INTEL: vsubbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] 0x62,0xe5,0x45,0x00,0x5c,0x34,0x6d,0x00,0xfe,0xff,0xff -# ATT: vsubnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -# INTEL: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +# ATT: vsubbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +# INTEL: vsubbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 0x62,0xe5,0x45,0x87,0x5c,0x71,0x7f -# ATT: vsubnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -# INTEL: vsubnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +# ATT: vsubbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +# INTEL: vsubbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} 0x62,0xe5,0x45,0x97,0x5c,0x72,0x80 diff --git a/llvm/test/MC/X86/avx10.2-bf16-32-att.s b/llvm/test/MC/X86/avx10.2-bf16-32-att.s index 9f62743177c9b..6b4f23c1ec01d 100644 --- a/llvm/test/MC/X86/avx10.2-bf16-32-att.s +++ b/llvm/test/MC/X86/avx10.2-bf16-32-att.s @@ -1,208 +1,208 @@ // RUN: llvm-mc -triple i386 --show-encoding %s | FileCheck %s -// CHECK: vaddnepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vaddbf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0xd4] - vaddnepbf16 %ymm4, %ymm3, %ymm2 + vaddbf16 %ymm4, %ymm3, %ymm2 -// CHECK: vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0xd4] - vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vaddnepbf16 %ymm4, %ymm3, %ymm2 
{%k7} {z} +// CHECK: vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0xd4] - vaddnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vaddnepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vaddbf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0xd4] - vaddnepbf16 %zmm4, %zmm3, %zmm2 + vaddbf16 %zmm4, %zmm3, %zmm2 -// CHECK: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x58,0xd4] - vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0xd4] - vaddnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vaddnepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vaddbf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0xd4] - vaddnepbf16 %xmm4, %xmm3, %xmm2 + vaddbf16 %xmm4, %xmm3, %xmm2 -// CHECK: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0xd4] - vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0xd4] - vaddnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vaddnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vaddbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x94,0xf4,0x00,0x00,0x00,0x10] - vaddnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vaddbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vaddnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vaddbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: 
[0x62,0xf5,0x65,0x4f,0x58,0x94,0x87,0x23,0x01,0x00,0x00] - vaddnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vaddbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vaddnepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vaddbf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x58,0x10] - vaddnepbf16 (%eax){1to32}, %zmm3, %zmm2 + vaddbf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vaddnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vaddbf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x14,0x6d,0x00,0xf8,0xff,0xff] - vaddnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vaddbf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vaddnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vaddbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0x51,0x7f] - vaddnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vaddbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vaddnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vaddbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x58,0x52,0x80] - vaddnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vaddbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vaddnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vaddbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x94,0xf4,0x00,0x00,0x00,0x10] - vaddnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vaddbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vaddnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vaddbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0x94,0x87,0x23,0x01,0x00,0x00] - vaddnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vaddbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vaddnepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vaddbf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x58,0x10] - vaddnepbf16 (%eax){1to16}, %ymm3, %ymm2 + vaddbf16 
(%eax){1to16}, %ymm3, %ymm2 -// CHECK: vaddnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vaddbf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x14,0x6d,0x00,0xfc,0xff,0xff] - vaddnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vaddbf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vaddnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vaddbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0x51,0x7f] - vaddnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vaddbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vaddnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vaddbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x58,0x52,0x80] - vaddnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vaddbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vaddnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vaddbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x94,0xf4,0x00,0x00,0x00,0x10] - vaddnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vaddbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vaddnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vaddbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0x94,0x87,0x23,0x01,0x00,0x00] - vaddnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vaddbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vaddnepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vaddbf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x58,0x10] - vaddnepbf16 (%eax){1to8}, %xmm3, %xmm2 + vaddbf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vaddnepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vaddbf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x14,0x6d,0x00,0xfe,0xff,0xff] - vaddnepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vaddbf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vaddnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vaddbf16 
2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0x51,0x7f] - vaddnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vaddbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vaddnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vaddbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x58,0x52,0x80] - vaddnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vaddbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vcmppbf16 $123, %ymm4, %ymm3, %k5 +// CHECK: vcmpbf16 $123, %ymm4, %ymm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xec,0x7b] - vcmppbf16 $123, %ymm4, %ymm3, %k5 + vcmpbf16 $123, %ymm4, %ymm3, %k5 -// CHECK: vcmppbf16 $123, %ymm4, %ymm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, %ymm4, %ymm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xec,0x7b] - vcmppbf16 $123, %ymm4, %ymm3, %k5 {%k7} + vcmpbf16 $123, %ymm4, %ymm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, %xmm4, %xmm3, %k5 +// CHECK: vcmpbf16 $123, %xmm4, %xmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xec,0x7b] - vcmppbf16 $123, %xmm4, %xmm3, %k5 + vcmpbf16 $123, %xmm4, %xmm3, %k5 -// CHECK: vcmppbf16 $123, %xmm4, %xmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, %xmm4, %xmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xec,0x7b] - vcmppbf16 $123, %xmm4, %xmm3, %k5 {%k7} + vcmpbf16 $123, %xmm4, %xmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, %zmm4, %zmm3, %k5 +// CHECK: vcmpbf16 $123, %zmm4, %zmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0xec,0x7b] - vcmppbf16 $123, %zmm4, %zmm3, %k5 + vcmpbf16 $123, %zmm4, %zmm3, %k5 -// CHECK: vcmppbf16 $123, %zmm4, %zmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, %zmm4, %zmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0xec,0x7b] - vcmppbf16 $123, %zmm4, %zmm3, %k5 {%k7} + vcmpbf16 $123, %zmm4, %zmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5 +// CHECK: vcmpbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5 // CHECK: encoding: 
[0x62,0xf3,0x67,0x48,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5 + vcmpbf16 $123, 268435456(%esp,%esi,8), %zmm3, %k5 -// CHECK: vcmppbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7} + vcmpbf16 $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, (%eax){1to32}, %zmm3, %k5 +// CHECK: vcmpbf16 $123, (%eax){1to32}, %zmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x58,0xc2,0x28,0x7b] - vcmppbf16 $123, (%eax){1to32}, %zmm3, %k5 + vcmpbf16 $123, (%eax){1to32}, %zmm3, %k5 -// CHECK: vcmppbf16 $123, -2048(,%ebp,2), %zmm3, %k5 +// CHECK: vcmpbf16 $123, -2048(,%ebp,2), %zmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vcmppbf16 $123, -2048(,%ebp,2), %zmm3, %k5 + vcmpbf16 $123, -2048(,%ebp,2), %zmm3, %k5 -// CHECK: vcmppbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0x69,0x7f,0x7b] - vcmppbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7} + vcmpbf16 $123, 8128(%ecx), %zmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x5f,0xc2,0x6a,0x80,0x7b] - vcmppbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7} + vcmpbf16 $123, -256(%edx){1to32}, %zmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5 +// CHECK: vcmpbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5 + vcmpbf16 $123, 268435456(%esp,%esi,8), %xmm3, %k5 -// CHECK: vcmppbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7} // 
CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7} + vcmpbf16 $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, (%eax){1to8}, %xmm3, %k5 +// CHECK: vcmpbf16 $123, (%eax){1to8}, %xmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x18,0xc2,0x28,0x7b] - vcmppbf16 $123, (%eax){1to8}, %xmm3, %k5 + vcmpbf16 $123, (%eax){1to8}, %xmm3, %k5 -// CHECK: vcmppbf16 $123, -512(,%ebp,2), %xmm3, %k5 +// CHECK: vcmpbf16 $123, -512(,%ebp,2), %xmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vcmppbf16 $123, -512(,%ebp,2), %xmm3, %k5 + vcmpbf16 $123, -512(,%ebp,2), %xmm3, %k5 -// CHECK: vcmppbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0x69,0x7f,0x7b] - vcmppbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7} + vcmpbf16 $123, 2032(%ecx), %xmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x1f,0xc2,0x6a,0x80,0x7b] - vcmppbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7} + vcmpbf16 $123, -256(%edx){1to8}, %xmm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5 +// CHECK: vcmpbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5 + vcmpbf16 $123, 268435456(%esp,%esi,8), %ymm3, %k5 -// CHECK: vcmppbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7} + vcmpbf16 $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, (%eax){1to16}, %ymm3, %k5 +// CHECK: vcmpbf16 $123, (%eax){1to16}, %ymm3, %k5 // CHECK: 
encoding: [0x62,0xf3,0x67,0x38,0xc2,0x28,0x7b] - vcmppbf16 $123, (%eax){1to16}, %ymm3, %k5 + vcmpbf16 $123, (%eax){1to16}, %ymm3, %k5 -// CHECK: vcmppbf16 $123, -1024(,%ebp,2), %ymm3, %k5 +// CHECK: vcmpbf16 $123, -1024(,%ebp,2), %ymm3, %k5 // CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vcmppbf16 $123, -1024(,%ebp,2), %ymm3, %k5 + vcmpbf16 $123, -1024(,%ebp,2), %ymm3, %k5 -// CHECK: vcmppbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0x69,0x7f,0x7b] - vcmppbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7} + vcmpbf16 $123, 4064(%ecx), %ymm3, %k5 {%k7} -// CHECK: vcmppbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7} +// CHECK: vcmpbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x67,0x3f,0xc2,0x6a,0x80,0x7b] - vcmppbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7} + vcmpbf16 $123, -256(%edx){1to16}, %ymm3, %k5 {%k7} // CHECK: vcomsbf16 %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x2f,0xd3] @@ -232,2783 +232,2783 @@ // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x2f,0x52,0x80] vcomsbf16 -256(%edx), %xmm2 -// CHECK: vdivnepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vdivbf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0xd4] - vdivnepbf16 %ymm4, %ymm3, %ymm2 + vdivbf16 %ymm4, %ymm3, %ymm2 -// CHECK: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0xd4] - vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0xd4] - vdivnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vdivnepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vdivbf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0xd4] - vdivnepbf16 %zmm4, %zmm3, 
%zmm2 + vdivbf16 %zmm4, %zmm3, %zmm2 -// CHECK: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0xd4] - vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0xd4] - vdivnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vdivnepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vdivbf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0xd4] - vdivnepbf16 %xmm4, %xmm3, %xmm2 + vdivbf16 %xmm4, %xmm3, %xmm2 -// CHECK: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0xd4] - vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0xd4] - vdivnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vdivnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vdivbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10] - vdivnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vdivbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vdivnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vdivbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00] - vdivnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vdivbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vdivnepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vdivbf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5e,0x10] - vdivnepbf16 (%eax){1to32}, %zmm3, %zmm2 + vdivbf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: 
vdivnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vdivbf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x14,0x6d,0x00,0xf8,0xff,0xff] - vdivnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vdivbf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vdivnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vdivbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0x51,0x7f] - vdivnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vdivbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vdivnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vdivbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5e,0x52,0x80] - vdivnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vdivbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vdivnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vdivbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10] - vdivnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vdivbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vdivnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vdivbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00] - vdivnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vdivbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vdivnepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vdivbf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5e,0x10] - vdivnepbf16 (%eax){1to16}, %ymm3, %ymm2 + vdivbf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vdivnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vdivbf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0x14,0x6d,0x00,0xfc,0xff,0xff] - vdivnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vdivbf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vdivnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vdivbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} 
// CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0x51,0x7f] - vdivnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vdivbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vdivnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vdivbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5e,0x52,0x80] - vdivnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vdivbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vdivnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vdivbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10] - vdivnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vdivbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vdivnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vdivbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00] - vdivnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vdivbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vdivnepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vdivbf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5e,0x10] - vdivnepbf16 (%eax){1to8}, %xmm3, %xmm2 + vdivbf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vdivnepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vdivbf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x14,0x6d,0x00,0xfe,0xff,0xff] - vdivnepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vdivbf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vdivnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vdivbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0x51,0x7f] - vdivnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vdivbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vdivnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vdivbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5e,0x52,0x80] - vdivnepbf16 -256(%edx){1to8}, 
%xmm3, %xmm2 {%k7} {z} + vdivbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfmadd132bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0xd4] - vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 + vfmadd132bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0xd4] - vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0xd4] - vfmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfmadd132bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0xd4] - vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 + vfmadd132bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0xd4] - vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0xd4] - vfmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfmadd132bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0xd4] - vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 + vfmadd132bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0xd4] - vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: 
vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0xd4] - vfmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfmadd132bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x98,0x10] - vfmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfmadd132bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0x51,0x7f] - vfmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x98,0x52,0x80] - vfmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 
{%k7} {z} -// CHECK: vfmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfmadd132bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x98,0x10] - vfmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfmadd132bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0x51,0x7f] - vfmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x98,0x52,0x80] - vfmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 
268435456(%esp,%esi,8), %xmm3, %xmm2 + vfmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfmadd132bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x98,0x10] - vfmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfmadd132bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0x51,0x7f] - vfmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x98,0x52,0x80] - vfmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfmadd213bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0xd4] - vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 + vfmadd213bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0xd4] - vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: 
vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0xd4] - vfmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfmadd213bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0xd4] - vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 + vfmadd213bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0xd4] - vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0xd4] - vfmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfmadd213bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0xd4] - vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 + vfmadd213bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0xd4] - vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0xd4] - vfmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfmadd213bf16 268435456(%esp,%esi,8), 
%zmm3, %zmm2 -// CHECK: vfmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfmadd213bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xa8,0x10] - vfmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfmadd213bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0x51,0x7f] - vfmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xa8,0x52,0x80] - vfmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 
291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfmadd213bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xa8,0x10] - vfmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfmadd213bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0x51,0x7f] - vfmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xa8,0x52,0x80] - vfmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfmadd213bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: 
[0x62,0xf6,0x64,0x18,0xa8,0x10] - vfmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfmadd213bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0x51,0x7f] - vfmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xa8,0x52,0x80] - vfmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfmadd231bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0xd4] - vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 + vfmadd231bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0xd4] - vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0xd4] - vfmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfmadd231bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0xd4] - vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 + vfmadd231bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// 
CHECK: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0xd4] - vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0xd4] - vfmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfmadd231bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0xd4] - vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 + vfmadd231bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0xd4] - vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xb8,0xd4] - vfmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfmadd231bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xb8,0x10] - vfmadd231nepbf16 (%eax){1to32}, %zmm3, 
%zmm2 + vfmadd231bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0x51,0x7f] - vfmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xb8,0x52,0x80] - vfmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfmadd231bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xb8,0x10] - vfmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfmadd231bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x14,0x6d,0x00,0xfc,0xff,0xff] - 
vfmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0x51,0x7f] - vfmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xb8,0x52,0x80] - vfmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfmadd231bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xb8,0x10] - vfmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfmadd231bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x64,0x8f,0xb8,0x51,0x7f] - vfmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xb8,0x52,0x80] - vfmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfmsub132bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0xd4] - vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 + vfmsub132bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9a,0xd4] - vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0xd4] - vfmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfmsub132bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0xd4] - vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 + vfmsub132bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0xd4] - vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0xd4] - vfmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfmsub132bf16 %xmm4, %xmm3, %xmm2 // 
CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0xd4] - vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 + vfmsub132bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0xd4] - vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0xd4] - vfmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfmsub132bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9a,0x10] - vfmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfmsub132bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0x51,0x7f] - vfmsub132nepbf16 8128(%ecx), 
%zmm3, %zmm2 {%k7} {z} + vfmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9a,0x52,0x80] - vfmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfmsub132bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9a,0x10] - vfmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfmsub132bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0x51,0x7f] - vfmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x64,0xbf,0x9a,0x52,0x80] - vfmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfmsub132bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9a,0x10] - vfmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfmsub132bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0x51,0x7f] - vfmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9a,0x52,0x80] - vfmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfmsub213bf16 %ymm4, %ymm3, %ymm2 // 
CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0xd4] - vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 + vfmsub213bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0xd4] - vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0xd4] - vfmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfmsub213bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0xd4] - vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 + vfmsub213bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0xd4] - vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0xd4] - vfmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfmsub213bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0xd4] - vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 + vfmsub213bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0xd4] - vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0xd4] - vfmsub213nepbf16 
%xmm4, %xmm3, %xmm2 {%k7} {z} + vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfmsub213bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xaa,0x10] - vfmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfmsub213bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0x51,0x7f] - vfmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xaa,0x52,0x80] - vfmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: 
[0x62,0xf6,0x64,0x28,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfmsub213bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xaa,0x10] - vfmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfmsub213bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0x51,0x7f] - vfmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xaa,0x52,0x80] - vfmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: 
vfmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfmsub213bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xaa,0x10] - vfmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfmsub213bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0x51,0x7f] - vfmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xaa,0x52,0x80] - vfmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfmsub231bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0xd4] - vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 + vfmsub231bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0xd4] - vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0xd4] - 
vfmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfmsub231bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0xd4] - vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 + vfmsub231bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xba,0xd4] - vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0xd4] - vfmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfmsub231bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0xd4] - vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 + vfmsub231bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0xd4] - vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0xd4] - vfmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: 
encoding: [0x62,0xf6,0x64,0x4f,0xba,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfmsub231bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xba,0x10] - vfmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfmsub231bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0x51,0x7f] - vfmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xba,0x52,0x80] - vfmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: 
vfmsub231bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xba,0x10] - vfmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfmsub231bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0x51,0x7f] - vfmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xba,0x52,0x80] - vfmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfmsub231bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xba,0x10] - vfmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfmsub231bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// 
CHECK: vfmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0x51,0x7f] - vfmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xba,0x52,0x80] - vfmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0xd4] - vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 + vfnmadd132bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0xd4] - vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0xd4] - vfnmadd132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0xd4] - vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 + vfnmadd132bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0xd4] - vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfnmadd132bf16 %zmm4, 
%zmm3, %zmm2 {%k7} -// CHECK: vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0xd4] - vfnmadd132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0xd4] - vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 + vfnmadd132bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0xd4] - vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0xd4] - vfnmadd132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfnmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfnmadd132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfnmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfnmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfnmadd132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfnmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfnmadd132bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9c,0x10] - vfnmadd132nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfnmadd132bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfnmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfnmadd132bf16 
-2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfnmadd132bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfnmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0x51,0x7f] - vfnmadd132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfnmadd132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9c,0x52,0x80] - vfnmadd132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfnmadd132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfnmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfnmadd132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfnmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfnmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfnmadd132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfnmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfnmadd132bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9c,0x10] - vfnmadd132nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfnmadd132bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfnmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfnmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfnmadd132bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: 
vfnmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0x51,0x7f] - vfnmadd132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfnmadd132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9c,0x52,0x80] - vfnmadd132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfnmadd132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfnmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfnmadd132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfnmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfnmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfnmadd132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfnmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfnmadd132bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9c,0x10] - vfnmadd132nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfnmadd132bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfnmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfnmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfnmadd132bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfnmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0x51,0x7f] - vfnmadd132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} 
+ vfnmadd132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9c,0x52,0x80] - vfnmadd132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfnmadd132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0xd4] - vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 + vfnmadd213bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0xd4] - vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0xd4] - vfnmadd213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0xd4] - vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 + vfnmadd213bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0xd4] - vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0xd4] - vfnmadd213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0xd4] - 
vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 + vfnmadd213bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0xd4] - vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0xd4] - vfnmadd213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfnmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfnmadd213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfnmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfnmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfnmadd213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfnmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfnmadd213bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xac,0x10] - vfnmadd213nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfnmadd213bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfnmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfnmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfnmadd213bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfnmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0x51,0x7f] - vfnmadd213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} 
+ vfnmadd213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xac,0x52,0x80] - vfnmadd213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfnmadd213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfnmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfnmadd213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfnmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfnmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfnmadd213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfnmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfnmadd213bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xac,0x10] - vfnmadd213nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfnmadd213bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfnmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfnmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfnmadd213bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfnmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0x51,0x7f] - vfnmadd213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfnmadd213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x64,0xbf,0xac,0x52,0x80] - vfnmadd213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfnmadd213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfnmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfnmadd213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfnmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfnmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfnmadd213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfnmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfnmadd213bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xac,0x10] - vfnmadd213nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfnmadd213bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfnmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfnmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfnmadd213bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfnmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0x51,0x7f] - vfnmadd213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfnmadd213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xac,0x52,0x80] - vfnmadd213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfnmadd213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: 
vfnmadd231bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0xd4] - vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 + vfnmadd231bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0xd4] - vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0xd4] - vfnmadd231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0xd4] - vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 + vfnmadd231bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0xd4] - vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0xd4] - vfnmadd231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0xd4] - vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 + vfnmadd231bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0xd4] - vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} 
// CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0xd4] - vfnmadd231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfnmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfnmadd231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfnmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfnmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfnmadd231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfnmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfnmadd231bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbc,0x10] - vfnmadd231nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfnmadd231bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfnmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfnmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfnmadd231bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfnmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0x51,0x7f] - vfnmadd231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfnmadd231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbc,0x52,0x80] - vfnmadd231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfnmadd231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// 
CHECK: vfnmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfnmadd231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfnmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfnmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfnmadd231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfnmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfnmadd231bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbc,0x10] - vfnmadd231nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfnmadd231bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfnmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfnmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfnmadd231bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfnmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0x51,0x7f] - vfnmadd231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfnmadd231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbc,0x52,0x80] - vfnmadd231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfnmadd231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfnmadd231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfnmadd231bf16 
268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfnmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfnmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfnmadd231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfnmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfnmadd231bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbc,0x10] - vfnmadd231nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfnmadd231bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfnmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfnmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfnmadd231bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfnmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0x51,0x7f] - vfnmadd231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfnmadd231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbc,0x52,0x80] - vfnmadd231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfnmadd231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0xd4] - vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 + vfnmsub132bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9e,0xd4] - vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfnmsub132nepbf16 %ymm4, 
%ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0xd4] - vfnmsub132nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0xd4] - vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 + vfnmsub132bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0xd4] - vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0xd4] - vfnmsub132nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0xd4] - vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 + vfnmsub132bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0xd4] - vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0xd4] - vfnmsub132nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfnmsub132bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfnmsub132bf16 
268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfnmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfnmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfnmsub132bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfnmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfnmsub132bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9e,0x10] - vfnmsub132nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfnmsub132bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfnmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfnmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub132nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfnmsub132bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfnmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0x51,0x7f] - vfnmsub132nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfnmsub132bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9e,0x52,0x80] - vfnmsub132nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfnmsub132bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfnmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfnmsub132bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfnmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfnmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: 
[0x62,0xf6,0x64,0x2f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfnmsub132bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfnmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfnmsub132bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9e,0x10] - vfnmsub132nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfnmsub132bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfnmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfnmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub132nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfnmsub132bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfnmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0x51,0x7f] - vfnmsub132nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfnmsub132bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9e,0x52,0x80] - vfnmsub132nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfnmsub132bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfnmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfnmsub132bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfnmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfnmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfnmsub132bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfnmsub132nepbf16 (%eax){1to8}, %xmm3, 
%xmm2 +// CHECK: vfnmsub132bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9e,0x10] - vfnmsub132nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfnmsub132bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfnmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfnmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub132nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfnmsub132bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfnmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0x51,0x7f] - vfnmsub132nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfnmsub132bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9e,0x52,0x80] - vfnmsub132nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfnmsub132bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0xd4] - vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 + vfnmsub213bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0xd4] - vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0xd4] - vfnmsub213nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0xd4] - vfnmsub213nepbf16 %zmm4, 
%zmm3, %zmm2 + vfnmsub213bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0xd4] - vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0xd4] - vfnmsub213nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0xd4] - vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 + vfnmsub213bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0xd4] - vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xae,0xd4] - vfnmsub213nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfnmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfnmsub213bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfnmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfnmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfnmsub213bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfnmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: 
vfnmsub213bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xae,0x10] - vfnmsub213nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfnmsub213bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfnmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfnmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub213nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vfnmsub213bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfnmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0x51,0x7f] - vfnmsub213nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfnmsub213bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xae,0x52,0x80] - vfnmsub213nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfnmsub213bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfnmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfnmsub213bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfnmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfnmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfnmsub213bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfnmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfnmsub213bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xae,0x10] - vfnmsub213nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfnmsub213bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfnmsub213nepbf16 
-1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfnmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub213nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfnmsub213bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfnmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0x51,0x7f] - vfnmsub213nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfnmsub213bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xae,0x52,0x80] - vfnmsub213nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfnmsub213bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfnmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfnmsub213bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfnmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfnmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfnmsub213bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfnmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfnmsub213bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xae,0x10] - vfnmsub213nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfnmsub213bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfnmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfnmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub213nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + 
vfnmsub213bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfnmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xae,0x51,0x7f] - vfnmsub213nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfnmsub213bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xae,0x52,0x80] - vfnmsub213nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfnmsub213bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0xd4] - vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 + vfnmsub231bf16 %ymm4, %ymm3, %ymm2 -// CHECK: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0xd4] - vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbe,0xd4] - vfnmsub231nepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0xd4] - vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 + vfnmsub231bf16 %zmm4, %zmm3, %zmm2 -// CHECK: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0xd4] - vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x64,0xcf,0xbe,0xd4] - vfnmsub231nepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0xd4] - vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 + vfnmsub231bf16 %xmm4, %xmm3, %xmm2 -// CHECK: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0xd4] - vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0xd4] - vfnmsub231nepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vfnmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vfnmsub231bf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vfnmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vfnmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vfnmsub231bf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vfnmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vfnmsub231bf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbe,0x10] - vfnmsub231nepbf16 (%eax){1to32}, %zmm3, %zmm2 + vfnmsub231bf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vfnmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vfnmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub231nepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + 
vfnmsub231bf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vfnmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbe,0x51,0x7f] - vfnmsub231nepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vfnmsub231bf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vfnmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbe,0x52,0x80] - vfnmsub231nepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vfnmsub231bf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vfnmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vfnmsub231bf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vfnmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vfnmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vfnmsub231bf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vfnmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vfnmsub231bf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbe,0x10] - vfnmsub231nepbf16 (%eax){1to16}, %ymm3, %ymm2 + vfnmsub231bf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vfnmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vfnmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub231nepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vfnmsub231bf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vfnmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x64,0xaf,0xbe,0x51,0x7f] - vfnmsub231nepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vfnmsub231bf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vfnmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbe,0x52,0x80] - vfnmsub231nepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vfnmsub231bf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vfnmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vfnmsub231bf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vfnmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vfnmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vfnmsub231bf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vfnmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vfnmsub231bf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbe,0x10] - vfnmsub231nepbf16 (%eax){1to8}, %xmm3, %xmm2 + vfnmsub231bf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vfnmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vfnmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub231nepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vfnmsub231bf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vfnmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vfnmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0x51,0x7f] - vfnmsub231nepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vfnmsub231bf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vfnmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: 
vfnmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbe,0x52,0x80] - vfnmsub231nepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vfnmsub231bf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vfpclasspbf16 $123, %zmm3, %k5 +// CHECK: vfpclassbf16 $123, %zmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0xeb,0x7b] - vfpclasspbf16 $123, %zmm3, %k5 + vfpclassbf16 $123, %zmm3, %k5 -// CHECK: vfpclasspbf16 $123, %zmm3, %k5 {%k7} +// CHECK: vfpclassbf16 $123, %zmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0xeb,0x7b] - vfpclasspbf16 $123, %zmm3, %k5 {%k7} + vfpclassbf16 $123, %zmm3, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, %ymm3, %k5 +// CHECK: vfpclassbf16 $123, %ymm3, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0xeb,0x7b] - vfpclasspbf16 $123, %ymm3, %k5 + vfpclassbf16 $123, %ymm3, %k5 -// CHECK: vfpclasspbf16 $123, %ymm3, %k5 {%k7} +// CHECK: vfpclassbf16 $123, %ymm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0xeb,0x7b] - vfpclasspbf16 $123, %ymm3, %k5 {%k7} + vfpclassbf16 $123, %ymm3, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, %xmm3, %k5 +// CHECK: vfpclassbf16 $123, %xmm3, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xeb,0x7b] - vfpclasspbf16 $123, %xmm3, %k5 + vfpclassbf16 $123, %xmm3, %k5 -// CHECK: vfpclasspbf16 $123, %xmm3, %k5 {%k7} +// CHECK: vfpclassbf16 $123, %xmm3, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0xeb,0x7b] - vfpclasspbf16 $123, %xmm3, %k5 {%k7} + vfpclassbf16 $123, %xmm3, %k5 {%k7} -// CHECK: vfpclasspbf16x $123, 268435456(%esp,%esi,8), %k5 +// CHECK: vfpclassbf16x $123, 268435456(%esp,%esi,8), %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vfpclasspbf16x $123, 268435456(%esp,%esi,8), %k5 + vfpclassbf16x $123, 268435456(%esp,%esi,8), %k5 -// CHECK: vfpclasspbf16x $123, 291(%edi,%eax,4), %k5 {%k7} +// CHECK: vfpclassbf16x $123, 291(%edi,%eax,4), %k5 {%k7} // CHECK: encoding: 
[0x62,0xf3,0x7f,0x0f,0x66,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vfpclasspbf16x $123, 291(%edi,%eax,4), %k5 {%k7} + vfpclassbf16x $123, 291(%edi,%eax,4), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, (%eax){1to8}, %k5 +// CHECK: vfpclassbf16 $123, (%eax){1to8}, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x28,0x7b] - vfpclasspbf16 $123, (%eax){1to8}, %k5 + vfpclassbf16 $123, (%eax){1to8}, %k5 -// CHECK: vfpclasspbf16x $123, -512(,%ebp,2), %k5 +// CHECK: vfpclassbf16x $123, -512(,%ebp,2), %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vfpclasspbf16x $123, -512(,%ebp,2), %k5 + vfpclassbf16x $123, -512(,%ebp,2), %k5 -// CHECK: vfpclasspbf16x $123, 2032(%ecx), %k5 {%k7} +// CHECK: vfpclassbf16x $123, 2032(%ecx), %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16x $123, 2032(%ecx), %k5 {%k7} + vfpclassbf16x $123, 2032(%ecx), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, -256(%edx){1to8}, %k5 {%k7} +// CHECK: vfpclassbf16 $123, -256(%edx){1to8}, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 $123, -256(%edx){1to8}, %k5 {%k7} + vfpclassbf16 $123, -256(%edx){1to8}, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, (%eax){1to16}, %k5 +// CHECK: vfpclassbf16 $123, (%eax){1to16}, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x28,0x7b] - vfpclasspbf16 $123, (%eax){1to16}, %k5 + vfpclassbf16 $123, (%eax){1to16}, %k5 -// CHECK: vfpclasspbf16y $123, -1024(,%ebp,2), %k5 +// CHECK: vfpclassbf16y $123, -1024(,%ebp,2), %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vfpclasspbf16y $123, -1024(,%ebp,2), %k5 + vfpclassbf16y $123, -1024(,%ebp,2), %k5 -// CHECK: vfpclasspbf16y $123, 4064(%ecx), %k5 {%k7} +// CHECK: vfpclassbf16y $123, 4064(%ecx), %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16y $123, 4064(%ecx), %k5 {%k7} + vfpclassbf16y $123, 4064(%ecx), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, 
-256(%edx){1to16}, %k5 {%k7} +// CHECK: vfpclassbf16 $123, -256(%edx){1to16}, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 $123, -256(%edx){1to16}, %k5 {%k7} + vfpclassbf16 $123, -256(%edx){1to16}, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, (%eax){1to32}, %k5 +// CHECK: vfpclassbf16 $123, (%eax){1to32}, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x28,0x7b] - vfpclasspbf16 $123, (%eax){1to32}, %k5 + vfpclassbf16 $123, (%eax){1to32}, %k5 -// CHECK: vfpclasspbf16z $123, -2048(,%ebp,2), %k5 +// CHECK: vfpclassbf16z $123, -2048(,%ebp,2), %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vfpclasspbf16z $123, -2048(,%ebp,2), %k5 + vfpclassbf16z $123, -2048(,%ebp,2), %k5 -// CHECK: vfpclasspbf16z $123, 8128(%ecx), %k5 {%k7} +// CHECK: vfpclassbf16z $123, 8128(%ecx), %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16z $123, 8128(%ecx), %k5 {%k7} + vfpclassbf16z $123, 8128(%ecx), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, -256(%edx){1to32}, %k5 {%k7} +// CHECK: vfpclassbf16 $123, -256(%edx){1to32}, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 $123, -256(%edx){1to32}, %k5 {%k7} + vfpclassbf16 $123, -256(%edx){1to32}, %k5 {%k7} -// CHECK: vgetexppbf16 %xmm3, %xmm2 +// CHECK: vgetexpbf16 %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0xd3] - vgetexppbf16 %xmm3, %xmm2 + vgetexpbf16 %xmm3, %xmm2 -// CHECK: vgetexppbf16 %xmm3, %xmm2 {%k7} +// CHECK: vgetexpbf16 %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0xd3] - vgetexppbf16 %xmm3, %xmm2 {%k7} + vgetexpbf16 %xmm3, %xmm2 {%k7} -// CHECK: vgetexppbf16 %xmm3, %xmm2 {%k7} {z} +// CHECK: vgetexpbf16 %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0xd3] - vgetexppbf16 %xmm3, %xmm2 {%k7} {z} + vgetexpbf16 %xmm3, %xmm2 {%k7} {z} -// CHECK: vgetexppbf16 %zmm3, %zmm2 +// CHECK: vgetexpbf16 %zmm3, %zmm2 // CHECK: encoding: 
[0x62,0xf5,0x7d,0x48,0x42,0xd3] - vgetexppbf16 %zmm3, %zmm2 + vgetexpbf16 %zmm3, %zmm2 -// CHECK: vgetexppbf16 %zmm3, %zmm2 {%k7} +// CHECK: vgetexpbf16 %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0xd3] - vgetexppbf16 %zmm3, %zmm2 {%k7} + vgetexpbf16 %zmm3, %zmm2 {%k7} -// CHECK: vgetexppbf16 %zmm3, %zmm2 {%k7} {z} +// CHECK: vgetexpbf16 %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0xd3] - vgetexppbf16 %zmm3, %zmm2 {%k7} {z} + vgetexpbf16 %zmm3, %zmm2 {%k7} {z} -// CHECK: vgetexppbf16 %ymm3, %ymm2 +// CHECK: vgetexpbf16 %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0xd3] - vgetexppbf16 %ymm3, %ymm2 + vgetexpbf16 %ymm3, %ymm2 -// CHECK: vgetexppbf16 %ymm3, %ymm2 {%k7} +// CHECK: vgetexpbf16 %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0xd3] - vgetexppbf16 %ymm3, %ymm2 {%k7} + vgetexpbf16 %ymm3, %ymm2 {%k7} -// CHECK: vgetexppbf16 %ymm3, %ymm2 {%k7} {z} +// CHECK: vgetexpbf16 %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0xd3] - vgetexppbf16 %ymm3, %ymm2 {%k7} {z} + vgetexpbf16 %ymm3, %ymm2 {%k7} {z} -// CHECK: vgetexppbf16 268435456(%esp,%esi,8), %xmm2 +// CHECK: vgetexpbf16 268435456(%esp,%esi,8), %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0x94,0xf4,0x00,0x00,0x00,0x10] - vgetexppbf16 268435456(%esp,%esi,8), %xmm2 + vgetexpbf16 268435456(%esp,%esi,8), %xmm2 -// CHECK: vgetexppbf16 291(%edi,%eax,4), %xmm2 {%k7} +// CHECK: vgetexpbf16 291(%edi,%eax,4), %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0x94,0x87,0x23,0x01,0x00,0x00] - vgetexppbf16 291(%edi,%eax,4), %xmm2 {%k7} + vgetexpbf16 291(%edi,%eax,4), %xmm2 {%k7} -// CHECK: vgetexppbf16 (%eax){1to8}, %xmm2 +// CHECK: vgetexpbf16 (%eax){1to8}, %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x42,0x10] - vgetexppbf16 (%eax){1to8}, %xmm2 + vgetexpbf16 (%eax){1to8}, %xmm2 -// CHECK: vgetexppbf16 -512(,%ebp,2), %xmm2 +// CHECK: vgetexpbf16 -512(,%ebp,2), %xmm2 // CHECK: encoding: 
[0x62,0xf5,0x7d,0x08,0x42,0x14,0x6d,0x00,0xfe,0xff,0xff] - vgetexppbf16 -512(,%ebp,2), %xmm2 + vgetexpbf16 -512(,%ebp,2), %xmm2 -// CHECK: vgetexppbf16 2032(%ecx), %xmm2 {%k7} {z} +// CHECK: vgetexpbf16 2032(%ecx), %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0x51,0x7f] - vgetexppbf16 2032(%ecx), %xmm2 {%k7} {z} + vgetexpbf16 2032(%ecx), %xmm2 {%k7} {z} -// CHECK: vgetexppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +// CHECK: vgetexpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x42,0x52,0x80] - vgetexppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} + vgetexpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -// CHECK: vgetexppbf16 268435456(%esp,%esi,8), %ymm2 +// CHECK: vgetexpbf16 268435456(%esp,%esi,8), %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x94,0xf4,0x00,0x00,0x00,0x10] - vgetexppbf16 268435456(%esp,%esi,8), %ymm2 + vgetexpbf16 268435456(%esp,%esi,8), %ymm2 -// CHECK: vgetexppbf16 291(%edi,%eax,4), %ymm2 {%k7} +// CHECK: vgetexpbf16 291(%edi,%eax,4), %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0x94,0x87,0x23,0x01,0x00,0x00] - vgetexppbf16 291(%edi,%eax,4), %ymm2 {%k7} + vgetexpbf16 291(%edi,%eax,4), %ymm2 {%k7} -// CHECK: vgetexppbf16 (%eax){1to16}, %ymm2 +// CHECK: vgetexpbf16 (%eax){1to16}, %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x42,0x10] - vgetexppbf16 (%eax){1to16}, %ymm2 + vgetexpbf16 (%eax){1to16}, %ymm2 -// CHECK: vgetexppbf16 -1024(,%ebp,2), %ymm2 +// CHECK: vgetexpbf16 -1024(,%ebp,2), %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x14,0x6d,0x00,0xfc,0xff,0xff] - vgetexppbf16 -1024(,%ebp,2), %ymm2 + vgetexpbf16 -1024(,%ebp,2), %ymm2 -// CHECK: vgetexppbf16 4064(%ecx), %ymm2 {%k7} {z} +// CHECK: vgetexpbf16 4064(%ecx), %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0x51,0x7f] - vgetexppbf16 4064(%ecx), %ymm2 {%k7} {z} + vgetexpbf16 4064(%ecx), %ymm2 {%k7} {z} -// CHECK: vgetexppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +// CHECK: vgetexpbf16 -256(%edx){1to16}, %ymm2 {%k7} 
{z} // CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x42,0x52,0x80] - vgetexppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} + vgetexpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -// CHECK: vgetexppbf16 268435456(%esp,%esi,8), %zmm2 +// CHECK: vgetexpbf16 268435456(%esp,%esi,8), %zmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x94,0xf4,0x00,0x00,0x00,0x10] - vgetexppbf16 268435456(%esp,%esi,8), %zmm2 + vgetexpbf16 268435456(%esp,%esi,8), %zmm2 -// CHECK: vgetexppbf16 291(%edi,%eax,4), %zmm2 {%k7} +// CHECK: vgetexpbf16 291(%edi,%eax,4), %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0x94,0x87,0x23,0x01,0x00,0x00] - vgetexppbf16 291(%edi,%eax,4), %zmm2 {%k7} + vgetexpbf16 291(%edi,%eax,4), %zmm2 {%k7} -// CHECK: vgetexppbf16 (%eax){1to32}, %zmm2 +// CHECK: vgetexpbf16 (%eax){1to32}, %zmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x42,0x10] - vgetexppbf16 (%eax){1to32}, %zmm2 + vgetexpbf16 (%eax){1to32}, %zmm2 -// CHECK: vgetexppbf16 -2048(,%ebp,2), %zmm2 +// CHECK: vgetexpbf16 -2048(,%ebp,2), %zmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x14,0x6d,0x00,0xf8,0xff,0xff] - vgetexppbf16 -2048(,%ebp,2), %zmm2 + vgetexpbf16 -2048(,%ebp,2), %zmm2 -// CHECK: vgetexppbf16 8128(%ecx), %zmm2 {%k7} {z} +// CHECK: vgetexpbf16 8128(%ecx), %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0x51,0x7f] - vgetexppbf16 8128(%ecx), %zmm2 {%k7} {z} + vgetexpbf16 8128(%ecx), %zmm2 {%k7} {z} -// CHECK: vgetexppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +// CHECK: vgetexpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x42,0x52,0x80] - vgetexppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} + vgetexpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, %zmm3, %zmm2 +// CHECK: vgetmantbf16 $123, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %zmm3, %zmm2 + vgetmantbf16 $123, %zmm3, %zmm2 -// CHECK: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} +// CHECK: vgetmantbf16 $123, %zmm3, %zmm2 {%k7} // CHECK: 
encoding: [0x62,0xf3,0x7f,0x4f,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} + vgetmantbf16 $123, %zmm3, %zmm2 {%k7} -// CHECK: vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %zmm3, %zmm2 {%k7} {z} + vgetmantbf16 $123, %zmm3, %zmm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, %ymm3, %ymm2 +// CHECK: vgetmantbf16 $123, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %ymm3, %ymm2 + vgetmantbf16 $123, %ymm3, %ymm2 -// CHECK: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} +// CHECK: vgetmantbf16 $123, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} + vgetmantbf16 $123, %ymm3, %ymm2 {%k7} -// CHECK: vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %ymm3, %ymm2 {%k7} {z} + vgetmantbf16 $123, %ymm3, %ymm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, %xmm3, %xmm2 +// CHECK: vgetmantbf16 $123, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %xmm3, %xmm2 + vgetmantbf16 $123, %xmm3, %xmm2 -// CHECK: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} +// CHECK: vgetmantbf16 $123, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} + vgetmantbf16 $123, %xmm3, %xmm2 {%k7} -// CHECK: vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0xd3,0x7b] - vgetmantpbf16 $123, %xmm3, %xmm2 {%k7} {z} + vgetmantbf16 $123, %xmm3, %xmm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %xmm2 +// CHECK: vgetmantbf16 $123, 268435456(%esp,%esi,8), %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - 
vgetmantpbf16 $123, 268435456(%esp,%esi,8), %xmm2 + vgetmantbf16 $123, 268435456(%esp,%esi,8), %xmm2 -// CHECK: vgetmantpbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} +// CHECK: vgetmantbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} + vgetmantbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} -// CHECK: vgetmantpbf16 $123, (%eax){1to8}, %xmm2 +// CHECK: vgetmantbf16 $123, (%eax){1to8}, %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x26,0x10,0x7b] - vgetmantpbf16 $123, (%eax){1to8}, %xmm2 + vgetmantbf16 $123, (%eax){1to8}, %xmm2 -// CHECK: vgetmantpbf16 $123, -512(,%ebp,2), %xmm2 +// CHECK: vgetmantbf16 $123, -512(,%ebp,2), %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vgetmantpbf16 $123, -512(,%ebp,2), %xmm2 + vgetmantbf16 $123, -512(,%ebp,2), %xmm2 -// CHECK: vgetmantpbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0x51,0x7f,0x7b] - vgetmantpbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} + vgetmantbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x26,0x52,0x80,0x7b] - vgetmantpbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} + vgetmantbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %ymm2 +// CHECK: vgetmantbf16 $123, 268435456(%esp,%esi,8), %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 $123, 268435456(%esp,%esi,8), %ymm2 + vgetmantbf16 $123, 268435456(%esp,%esi,8), %ymm2 -// CHECK: vgetmantpbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} +// CHECK: vgetmantbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} // CHECK: encoding: 
[0x62,0xf3,0x7f,0x2f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} + vgetmantbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} -// CHECK: vgetmantpbf16 $123, (%eax){1to16}, %ymm2 +// CHECK: vgetmantbf16 $123, (%eax){1to16}, %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x26,0x10,0x7b] - vgetmantpbf16 $123, (%eax){1to16}, %ymm2 + vgetmantbf16 $123, (%eax){1to16}, %ymm2 -// CHECK: vgetmantpbf16 $123, -1024(,%ebp,2), %ymm2 +// CHECK: vgetmantbf16 $123, -1024(,%ebp,2), %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vgetmantpbf16 $123, -1024(,%ebp,2), %ymm2 + vgetmantbf16 $123, -1024(,%ebp,2), %ymm2 -// CHECK: vgetmantpbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0x51,0x7f,0x7b] - vgetmantpbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} + vgetmantbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x26,0x52,0x80,0x7b] - vgetmantpbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} + vgetmantbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, 268435456(%esp,%esi,8), %zmm2 +// CHECK: vgetmantbf16 $123, 268435456(%esp,%esi,8), %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 $123, 268435456(%esp,%esi,8), %zmm2 + vgetmantbf16 $123, 268435456(%esp,%esi,8), %zmm2 -// CHECK: vgetmantpbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} +// CHECK: vgetmantbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} + vgetmantbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} -// CHECK: vgetmantpbf16 $123, (%eax){1to32}, %zmm2 +// CHECK: vgetmantbf16 $123, (%eax){1to32}, %zmm2 // CHECK: 
encoding: [0x62,0xf3,0x7f,0x58,0x26,0x10,0x7b] - vgetmantpbf16 $123, (%eax){1to32}, %zmm2 + vgetmantbf16 $123, (%eax){1to32}, %zmm2 -// CHECK: vgetmantpbf16 $123, -2048(,%ebp,2), %zmm2 +// CHECK: vgetmantbf16 $123, -2048(,%ebp,2), %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vgetmantpbf16 $123, -2048(,%ebp,2), %zmm2 + vgetmantbf16 $123, -2048(,%ebp,2), %zmm2 -// CHECK: vgetmantpbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0x51,0x7f,0x7b] - vgetmantpbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} + vgetmantbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} -// CHECK: vgetmantpbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} +// CHECK: vgetmantbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x26,0x52,0x80,0x7b] - vgetmantpbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} + vgetmantbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} -// CHECK: vmaxpbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vmaxbf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0xd4] - vmaxpbf16 %ymm4, %ymm3, %ymm2 + vmaxbf16 %ymm4, %ymm3, %ymm2 -// CHECK: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0xd4] - vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} + vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0xd4] - vmaxpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vmaxpbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vmaxbf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0xd4] - vmaxpbf16 %zmm4, %zmm3, %zmm2 + vmaxbf16 %zmm4, %zmm3, %zmm2 -// CHECK: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0xd4] - vmaxpbf16 
%zmm4, %zmm3, %zmm2 {%k7} + vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0xd4] - vmaxpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vmaxpbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vmaxbf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0xd4] - vmaxpbf16 %xmm4, %xmm3, %xmm2 + vmaxbf16 %xmm4, %xmm3, %xmm2 -// CHECK: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0xd4] - vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} + vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0xd4] - vmaxpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vmaxpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vmaxbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10] - vmaxpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vmaxbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vmaxpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vmaxbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00] - vmaxpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vmaxbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vmaxpbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vmaxbf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5f,0x10] - vmaxpbf16 (%eax){1to32}, %zmm3, %zmm2 + vmaxbf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vmaxpbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vmaxbf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x14,0x6d,0x00,0xf8,0xff,0xff] - vmaxpbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vmaxbf16 
-2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vmaxpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vmaxbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0x51,0x7f] - vmaxpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vmaxbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vmaxpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vmaxbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5f,0x52,0x80] - vmaxpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vmaxbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vmaxpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vmaxbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10] - vmaxpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vmaxbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vmaxpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vmaxbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00] - vmaxpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vmaxbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vmaxpbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vmaxbf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5f,0x10] - vmaxpbf16 (%eax){1to16}, %ymm3, %ymm2 + vmaxbf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vmaxpbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vmaxbf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x14,0x6d,0x00,0xfc,0xff,0xff] - vmaxpbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vmaxbf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vmaxpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vmaxbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0x51,0x7f] - vmaxpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vmaxbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vmaxpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vmaxbf16 
-256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5f,0x52,0x80] - vmaxpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vmaxbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vmaxpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vmaxbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10] - vmaxpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vmaxbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vmaxpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vmaxbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00] - vmaxpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vmaxbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vmaxpbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vmaxbf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5f,0x10] - vmaxpbf16 (%eax){1to8}, %xmm3, %xmm2 + vmaxbf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vmaxpbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vmaxbf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x14,0x6d,0x00,0xfe,0xff,0xff] - vmaxpbf16 -512(,%ebp,2), %xmm3, %xmm2 + vmaxbf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vmaxpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vmaxbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0x51,0x7f] - vmaxpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vmaxbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vmaxpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vmaxbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5f,0x52,0x80] - vmaxpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vmaxbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vminpbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vminbf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0xd4] - vminpbf16 %ymm4, %ymm3, %ymm2 + vminbf16 %ymm4, %ymm3, 
%ymm2 -// CHECK: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vminbf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0xd4] - vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} + vminbf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vminbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0xd4] - vminpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vminbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vminpbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vminbf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0xd4] - vminpbf16 %zmm4, %zmm3, %zmm2 + vminbf16 %zmm4, %zmm3, %zmm2 -// CHECK: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vminbf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0xd4] - vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} + vminbf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vminbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0xd4] - vminpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vminbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vminpbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vminbf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0xd4] - vminpbf16 %xmm4, %xmm3, %xmm2 + vminbf16 %xmm4, %xmm3, %xmm2 -// CHECK: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vminbf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0xd4] - vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} + vminbf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vminbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0xd4] - vminpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vminbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vminpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vminbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10] - vminpbf16 268435456(%esp,%esi,8), 
%zmm3, %zmm2 + vminbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vminpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vminbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00] - vminpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vminbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vminpbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vminbf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5d,0x10] - vminpbf16 (%eax){1to32}, %zmm3, %zmm2 + vminbf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vminpbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vminbf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x14,0x6d,0x00,0xf8,0xff,0xff] - vminpbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vminbf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vminpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vminbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0x51,0x7f] - vminpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vminbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vminpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vminbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5d,0x52,0x80] - vminpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vminbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vminpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vminbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10] - vminpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vminbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vminpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vminbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00] - vminpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vminbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vminpbf16 (%eax){1to16}, 
%ymm3, %ymm2 +// CHECK: vminbf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5d,0x10] - vminpbf16 (%eax){1to16}, %ymm3, %ymm2 + vminbf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vminpbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vminbf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x14,0x6d,0x00,0xfc,0xff,0xff] - vminpbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vminbf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vminpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vminbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0x51,0x7f] - vminpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vminbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vminpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vminbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5d,0x52,0x80] - vminpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vminbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vminpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vminbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10] - vminpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vminbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vminpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vminbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00] - vminpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vminbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vminpbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vminbf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5d,0x10] - vminpbf16 (%eax){1to8}, %xmm3, %xmm2 + vminbf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vminpbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vminbf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x14,0x6d,0x00,0xfe,0xff,0xff] - vminpbf16 
-512(,%ebp,2), %xmm3, %xmm2 + vminbf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vminpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vminbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0x51,0x7f] - vminpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vminbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vminpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vminbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5d,0x52,0x80] - vminpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vminbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vmulnepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vmulbf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0xd4] - vmulnepbf16 %ymm4, %ymm3, %ymm2 + vmulbf16 %ymm4, %ymm3, %ymm2 -// CHECK: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x59,0xd4] - vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0xd4] - vmulnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vmulnepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vmulbf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0xd4] - vmulnepbf16 %zmm4, %zmm3, %zmm2 + vmulbf16 %zmm4, %zmm3, %zmm2 -// CHECK: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0xd4] - vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0xd4] - vmulnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vmulnepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: 
vmulbf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0xd4] - vmulnepbf16 %xmm4, %xmm3, %xmm2 + vmulbf16 %xmm4, %xmm3, %xmm2 -// CHECK: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0xd4] - vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0xd4] - vmulnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vmulnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vmulbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x94,0xf4,0x00,0x00,0x00,0x10] - vmulnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vmulbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vmulnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vmulbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0x94,0x87,0x23,0x01,0x00,0x00] - vmulnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vmulbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vmulnepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vmulbf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x59,0x10] - vmulnepbf16 (%eax){1to32}, %zmm3, %zmm2 + vmulbf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vmulnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vmulbf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x14,0x6d,0x00,0xf8,0xff,0xff] - vmulnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vmulbf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vmulnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vmulbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0x51,0x7f] - vmulnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vmulbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vmulnepbf16 -256(%edx){1to32}, 
%zmm3, %zmm2 {%k7} {z} +// CHECK: vmulbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x59,0x52,0x80] - vmulnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vmulbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vmulnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vmulbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x94,0xf4,0x00,0x00,0x00,0x10] - vmulnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vmulbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vmulnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vmulbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x59,0x94,0x87,0x23,0x01,0x00,0x00] - vmulnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vmulbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vmulnepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vmulbf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x59,0x10] - vmulnepbf16 (%eax){1to16}, %ymm3, %ymm2 + vmulbf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vmulnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vmulbf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x14,0x6d,0x00,0xfc,0xff,0xff] - vmulnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vmulbf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vmulnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vmulbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0x51,0x7f] - vmulnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vmulbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vmulnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vmulbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x59,0x52,0x80] - vmulnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vmulbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vmulnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vmulbf16 268435456(%esp,%esi,8), %xmm3, 
%xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x94,0xf4,0x00,0x00,0x00,0x10] - vmulnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vmulbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vmulnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vmulbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0x94,0x87,0x23,0x01,0x00,0x00] - vmulnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vmulbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vmulnepbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vmulbf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x59,0x10] - vmulnepbf16 (%eax){1to8}, %xmm3, %xmm2 + vmulbf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vmulnepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vmulbf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x14,0x6d,0x00,0xfe,0xff,0xff] - vmulnepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vmulbf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vmulnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vmulbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0x51,0x7f] - vmulnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vmulbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vmulnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vmulbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x59,0x52,0x80] - vmulnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vmulbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vrcppbf16 %xmm3, %xmm2 +// CHECK: vrcpbf16 %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0xd3] - vrcppbf16 %xmm3, %xmm2 + vrcpbf16 %xmm3, %xmm2 -// CHECK: vrcppbf16 %xmm3, %xmm2 {%k7} +// CHECK: vrcpbf16 %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0xd3] - vrcppbf16 %xmm3, %xmm2 {%k7} + vrcpbf16 %xmm3, %xmm2 {%k7} -// CHECK: vrcppbf16 %xmm3, %xmm2 {%k7} {z} +// CHECK: vrcpbf16 %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x7c,0x8f,0x4c,0xd3] - vrcppbf16 %xmm3, %xmm2 {%k7} {z} + vrcpbf16 %xmm3, %xmm2 {%k7} {z} -// CHECK: vrcppbf16 %zmm3, %zmm2 +// CHECK: vrcpbf16 %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0xd3] - vrcppbf16 %zmm3, %zmm2 + vrcpbf16 %zmm3, %zmm2 -// CHECK: vrcppbf16 %zmm3, %zmm2 {%k7} +// CHECK: vrcpbf16 %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0xd3] - vrcppbf16 %zmm3, %zmm2 {%k7} + vrcpbf16 %zmm3, %zmm2 {%k7} -// CHECK: vrcppbf16 %zmm3, %zmm2 {%k7} {z} +// CHECK: vrcpbf16 %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0xd3] - vrcppbf16 %zmm3, %zmm2 {%k7} {z} + vrcpbf16 %zmm3, %zmm2 {%k7} {z} -// CHECK: vrcppbf16 %ymm3, %ymm2 +// CHECK: vrcpbf16 %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0xd3] - vrcppbf16 %ymm3, %ymm2 + vrcpbf16 %ymm3, %ymm2 -// CHECK: vrcppbf16 %ymm3, %ymm2 {%k7} +// CHECK: vrcpbf16 %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0xd3] - vrcppbf16 %ymm3, %ymm2 {%k7} + vrcpbf16 %ymm3, %ymm2 {%k7} -// CHECK: vrcppbf16 %ymm3, %ymm2 {%k7} {z} +// CHECK: vrcpbf16 %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0xd3] - vrcppbf16 %ymm3, %ymm2 {%k7} {z} + vrcpbf16 %ymm3, %ymm2 {%k7} {z} -// CHECK: vrcppbf16 268435456(%esp,%esi,8), %xmm2 +// CHECK: vrcpbf16 268435456(%esp,%esi,8), %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10] - vrcppbf16 268435456(%esp,%esi,8), %xmm2 + vrcpbf16 268435456(%esp,%esi,8), %xmm2 -// CHECK: vrcppbf16 291(%edi,%eax,4), %xmm2 {%k7} +// CHECK: vrcpbf16 291(%edi,%eax,4), %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00] - vrcppbf16 291(%edi,%eax,4), %xmm2 {%k7} + vrcpbf16 291(%edi,%eax,4), %xmm2 {%k7} -// CHECK: vrcppbf16 (%eax){1to8}, %xmm2 +// CHECK: vrcpbf16 (%eax){1to8}, %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4c,0x10] - vrcppbf16 (%eax){1to8}, %xmm2 + vrcpbf16 (%eax){1to8}, %xmm2 -// CHECK: vrcppbf16 -512(,%ebp,2), %xmm2 
+// CHECK: vrcpbf16 -512(,%ebp,2), %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vrcppbf16 -512(,%ebp,2), %xmm2 + vrcpbf16 -512(,%ebp,2), %xmm2 -// CHECK: vrcppbf16 2032(%ecx), %xmm2 {%k7} {z} +// CHECK: vrcpbf16 2032(%ecx), %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4c,0x51,0x7f] - vrcppbf16 2032(%ecx), %xmm2 {%k7} {z} + vrcpbf16 2032(%ecx), %xmm2 {%k7} {z} -// CHECK: vrcppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +// CHECK: vrcpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4c,0x52,0x80] - vrcppbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} + vrcpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -// CHECK: vrcppbf16 268435456(%esp,%esi,8), %ymm2 +// CHECK: vrcpbf16 268435456(%esp,%esi,8), %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10] - vrcppbf16 268435456(%esp,%esi,8), %ymm2 + vrcpbf16 268435456(%esp,%esi,8), %ymm2 -// CHECK: vrcppbf16 291(%edi,%eax,4), %ymm2 {%k7} +// CHECK: vrcpbf16 291(%edi,%eax,4), %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00] - vrcppbf16 291(%edi,%eax,4), %ymm2 {%k7} + vrcpbf16 291(%edi,%eax,4), %ymm2 {%k7} -// CHECK: vrcppbf16 (%eax){1to16}, %ymm2 +// CHECK: vrcpbf16 (%eax){1to16}, %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4c,0x10] - vrcppbf16 (%eax){1to16}, %ymm2 + vrcpbf16 (%eax){1to16}, %ymm2 -// CHECK: vrcppbf16 -1024(,%ebp,2), %ymm2 +// CHECK: vrcpbf16 -1024(,%ebp,2), %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vrcppbf16 -1024(,%ebp,2), %ymm2 + vrcpbf16 -1024(,%ebp,2), %ymm2 -// CHECK: vrcppbf16 4064(%ecx), %ymm2 {%k7} {z} +// CHECK: vrcpbf16 4064(%ecx), %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0x51,0x7f] - vrcppbf16 4064(%ecx), %ymm2 {%k7} {z} + vrcpbf16 4064(%ecx), %ymm2 {%k7} {z} -// CHECK: vrcppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +// CHECK: vrcpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x7c,0xbf,0x4c,0x52,0x80] - vrcppbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} + vrcpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -// CHECK: vrcppbf16 268435456(%esp,%esi,8), %zmm2 +// CHECK: vrcpbf16 268435456(%esp,%esi,8), %zmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10] - vrcppbf16 268435456(%esp,%esi,8), %zmm2 + vrcpbf16 268435456(%esp,%esi,8), %zmm2 -// CHECK: vrcppbf16 291(%edi,%eax,4), %zmm2 {%k7} +// CHECK: vrcpbf16 291(%edi,%eax,4), %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00] - vrcppbf16 291(%edi,%eax,4), %zmm2 {%k7} + vrcpbf16 291(%edi,%eax,4), %zmm2 {%k7} -// CHECK: vrcppbf16 (%eax){1to32}, %zmm2 +// CHECK: vrcpbf16 (%eax){1to32}, %zmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4c,0x10] - vrcppbf16 (%eax){1to32}, %zmm2 + vrcpbf16 (%eax){1to32}, %zmm2 -// CHECK: vrcppbf16 -2048(,%ebp,2), %zmm2 +// CHECK: vrcpbf16 -2048(,%ebp,2), %zmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vrcppbf16 -2048(,%ebp,2), %zmm2 + vrcpbf16 -2048(,%ebp,2), %zmm2 -// CHECK: vrcppbf16 8128(%ecx), %zmm2 {%k7} {z} +// CHECK: vrcpbf16 8128(%ecx), %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0x51,0x7f] - vrcppbf16 8128(%ecx), %zmm2 {%k7} {z} + vrcpbf16 8128(%ecx), %zmm2 {%k7} {z} -// CHECK: vrcppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +// CHECK: vrcpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4c,0x52,0x80] - vrcppbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} + vrcpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, %zmm3, %zmm2 +// CHECK: vreducebf16 $123, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0xd3,0x7b] - vreducenepbf16 $123, %zmm3, %zmm2 + vreducebf16 $123, %zmm3, %zmm2 -// CHECK: vreducenepbf16 $123, %zmm3, %zmm2 {%k7} +// CHECK: vreducebf16 $123, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0xd3,0x7b] - vreducenepbf16 $123, %zmm3, %zmm2 {%k7} + vreducebf16 
$123, %zmm3, %zmm2 {%k7} -// CHECK: vreducenepbf16 $123, %zmm3, %zmm2 {%k7} {z} +// CHECK: vreducebf16 $123, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0xd3,0x7b] - vreducenepbf16 $123, %zmm3, %zmm2 {%k7} {z} + vreducebf16 $123, %zmm3, %zmm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, %ymm3, %ymm2 +// CHECK: vreducebf16 $123, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0xd3,0x7b] - vreducenepbf16 $123, %ymm3, %ymm2 + vreducebf16 $123, %ymm3, %ymm2 -// CHECK: vreducenepbf16 $123, %ymm3, %ymm2 {%k7} +// CHECK: vreducebf16 $123, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0xd3,0x7b] - vreducenepbf16 $123, %ymm3, %ymm2 {%k7} + vreducebf16 $123, %ymm3, %ymm2 {%k7} -// CHECK: vreducenepbf16 $123, %ymm3, %ymm2 {%k7} {z} +// CHECK: vreducebf16 $123, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0xd3,0x7b] - vreducenepbf16 $123, %ymm3, %ymm2 {%k7} {z} + vreducebf16 $123, %ymm3, %ymm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, %xmm3, %xmm2 +// CHECK: vreducebf16 $123, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0xd3,0x7b] - vreducenepbf16 $123, %xmm3, %xmm2 + vreducebf16 $123, %xmm3, %xmm2 -// CHECK: vreducenepbf16 $123, %xmm3, %xmm2 {%k7} +// CHECK: vreducebf16 $123, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0xd3,0x7b] - vreducenepbf16 $123, %xmm3, %xmm2 {%k7} + vreducebf16 $123, %xmm3, %xmm2 {%k7} -// CHECK: vreducenepbf16 $123, %xmm3, %xmm2 {%k7} {z} +// CHECK: vreducebf16 $123, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0xd3,0x7b] - vreducenepbf16 $123, %xmm3, %xmm2 {%k7} {z} + vreducebf16 $123, %xmm3, %xmm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, 268435456(%esp,%esi,8), %xmm2 +// CHECK: vreducebf16 $123, 268435456(%esp,%esi,8), %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 $123, 268435456(%esp,%esi,8), %xmm2 + vreducebf16 $123, 268435456(%esp,%esi,8), %xmm2 -// 
CHECK: vreducenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} +// CHECK: vreducebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} + vreducebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} -// CHECK: vreducenepbf16 $123, (%eax){1to8}, %xmm2 +// CHECK: vreducebf16 $123, (%eax){1to8}, %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x56,0x10,0x7b] - vreducenepbf16 $123, (%eax){1to8}, %xmm2 + vreducebf16 $123, (%eax){1to8}, %xmm2 -// CHECK: vreducenepbf16 $123, -512(,%ebp,2), %xmm2 +// CHECK: vreducebf16 $123, -512(,%ebp,2), %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vreducenepbf16 $123, -512(,%ebp,2), %xmm2 + vreducebf16 $123, -512(,%ebp,2), %xmm2 -// CHECK: vreducenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} +// CHECK: vreducebf16 $123, 2032(%ecx), %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0x51,0x7f,0x7b] - vreducenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} + vreducebf16 $123, 2032(%ecx), %xmm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} +// CHECK: vreducebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x56,0x52,0x80,0x7b] - vreducenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} + vreducebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, 268435456(%esp,%esi,8), %ymm2 +// CHECK: vreducebf16 $123, 268435456(%esp,%esi,8), %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 $123, 268435456(%esp,%esi,8), %ymm2 + vreducebf16 $123, 268435456(%esp,%esi,8), %ymm2 -// CHECK: vreducenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} +// CHECK: vreducebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} + vreducebf16 $123, 291(%edi,%eax,4), %ymm2 
{%k7} -// CHECK: vreducenepbf16 $123, (%eax){1to16}, %ymm2 +// CHECK: vreducebf16 $123, (%eax){1to16}, %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x56,0x10,0x7b] - vreducenepbf16 $123, (%eax){1to16}, %ymm2 + vreducebf16 $123, (%eax){1to16}, %ymm2 -// CHECK: vreducenepbf16 $123, -1024(,%ebp,2), %ymm2 +// CHECK: vreducebf16 $123, -1024(,%ebp,2), %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vreducenepbf16 $123, -1024(,%ebp,2), %ymm2 + vreducebf16 $123, -1024(,%ebp,2), %ymm2 -// CHECK: vreducenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} +// CHECK: vreducebf16 $123, 4064(%ecx), %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0x51,0x7f,0x7b] - vreducenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} + vreducebf16 $123, 4064(%ecx), %ymm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} +// CHECK: vreducebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x56,0x52,0x80,0x7b] - vreducenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} + vreducebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, 268435456(%esp,%esi,8), %zmm2 +// CHECK: vreducebf16 $123, 268435456(%esp,%esi,8), %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 $123, 268435456(%esp,%esi,8), %zmm2 + vreducebf16 $123, 268435456(%esp,%esi,8), %zmm2 -// CHECK: vreducenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} +// CHECK: vreducebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} + vreducebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} -// CHECK: vreducenepbf16 $123, (%eax){1to32}, %zmm2 +// CHECK: vreducebf16 $123, (%eax){1to32}, %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x56,0x10,0x7b] - vreducenepbf16 $123, (%eax){1to32}, %zmm2 + vreducebf16 $123, (%eax){1to32}, %zmm2 -// CHECK: vreducenepbf16 $123, 
-2048(,%ebp,2), %zmm2 +// CHECK: vreducebf16 $123, -2048(,%ebp,2), %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vreducenepbf16 $123, -2048(,%ebp,2), %zmm2 + vreducebf16 $123, -2048(,%ebp,2), %zmm2 -// CHECK: vreducenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} +// CHECK: vreducebf16 $123, 8128(%ecx), %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0x51,0x7f,0x7b] - vreducenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} + vreducebf16 $123, 8128(%ecx), %zmm2 {%k7} {z} -// CHECK: vreducenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} +// CHECK: vreducebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x56,0x52,0x80,0x7b] - vreducenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} + vreducebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, %zmm3, %zmm2 +// CHECK: vrndscalebf16 $123, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %zmm3, %zmm2 + vrndscalebf16 $123, %zmm3, %zmm2 -// CHECK: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} +// CHECK: vrndscalebf16 $123, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} + vrndscalebf16 $123, %zmm3, %zmm2 {%k7} -// CHECK: vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %zmm3, %zmm2 {%k7} {z} + vrndscalebf16 $123, %zmm3, %zmm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, %ymm3, %ymm2 +// CHECK: vrndscalebf16 $123, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %ymm3, %ymm2 + vrndscalebf16 $123, %ymm3, %ymm2 -// CHECK: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} +// CHECK: vrndscalebf16 $123, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} + vrndscalebf16 $123, 
%ymm3, %ymm2 {%k7} -// CHECK: vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %ymm3, %ymm2 {%k7} {z} + vrndscalebf16 $123, %ymm3, %ymm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, %xmm3, %xmm2 +// CHECK: vrndscalebf16 $123, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %xmm3, %xmm2 + vrndscalebf16 $123, %xmm3, %xmm2 -// CHECK: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} +// CHECK: vrndscalebf16 $123, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} + vrndscalebf16 $123, %xmm3, %xmm2 {%k7} -// CHECK: vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0xd3,0x7b] - vrndscalenepbf16 $123, %xmm3, %xmm2 {%k7} {z} + vrndscalebf16 $123, %xmm3, %xmm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %xmm2 +// CHECK: vrndscalebf16 $123, 268435456(%esp,%esi,8), %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %xmm2 + vrndscalebf16 $123, 268435456(%esp,%esi,8), %xmm2 -// CHECK: vrndscalenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} +// CHECK: vrndscalebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} + vrndscalebf16 $123, 291(%edi,%eax,4), %xmm2 {%k7} -// CHECK: vrndscalenepbf16 $123, (%eax){1to8}, %xmm2 +// CHECK: vrndscalebf16 $123, (%eax){1to8}, %xmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x08,0x10,0x7b] - vrndscalenepbf16 $123, (%eax){1to8}, %xmm2 + vrndscalebf16 $123, (%eax){1to8}, %xmm2 -// CHECK: vrndscalenepbf16 $123, -512(,%ebp,2), %xmm2 +// CHECK: vrndscalebf16 $123, -512(,%ebp,2), %xmm2 // 
CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vrndscalenepbf16 $123, -512(,%ebp,2), %xmm2 + vrndscalebf16 $123, -512(,%ebp,2), %xmm2 -// CHECK: vrndscalenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, 2032(%ecx), %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0x51,0x7f,0x7b] - vrndscalenepbf16 $123, 2032(%ecx), %xmm2 {%k7} {z} + vrndscalebf16 $123, 2032(%ecx), %xmm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x08,0x52,0x80,0x7b] - vrndscalenepbf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} + vrndscalebf16 $123, -256(%edx){1to8}, %xmm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %ymm2 +// CHECK: vrndscalebf16 $123, 268435456(%esp,%esi,8), %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %ymm2 + vrndscalebf16 $123, 268435456(%esp,%esi,8), %ymm2 -// CHECK: vrndscalenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} +// CHECK: vrndscalebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} + vrndscalebf16 $123, 291(%edi,%eax,4), %ymm2 {%k7} -// CHECK: vrndscalenepbf16 $123, (%eax){1to16}, %ymm2 +// CHECK: vrndscalebf16 $123, (%eax){1to16}, %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x08,0x10,0x7b] - vrndscalenepbf16 $123, (%eax){1to16}, %ymm2 + vrndscalebf16 $123, (%eax){1to16}, %ymm2 -// CHECK: vrndscalenepbf16 $123, -1024(,%ebp,2), %ymm2 +// CHECK: vrndscalebf16 $123, -1024(,%ebp,2), %ymm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vrndscalenepbf16 $123, -1024(,%ebp,2), %ymm2 + vrndscalebf16 $123, -1024(,%ebp,2), %ymm2 -// CHECK: vrndscalenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} +// CHECK: 
vrndscalebf16 $123, 4064(%ecx), %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0x51,0x7f,0x7b] - vrndscalenepbf16 $123, 4064(%ecx), %ymm2 {%k7} {z} + vrndscalebf16 $123, 4064(%ecx), %ymm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x08,0x52,0x80,0x7b] - vrndscalenepbf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} + vrndscalebf16 $123, -256(%edx){1to16}, %ymm2 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %zmm2 +// CHECK: vrndscalebf16 $123, 268435456(%esp,%esi,8), %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 $123, 268435456(%esp,%esi,8), %zmm2 + vrndscalebf16 $123, 268435456(%esp,%esi,8), %zmm2 -// CHECK: vrndscalenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} +// CHECK: vrndscalebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} + vrndscalebf16 $123, 291(%edi,%eax,4), %zmm2 {%k7} -// CHECK: vrndscalenepbf16 $123, (%eax){1to32}, %zmm2 +// CHECK: vrndscalebf16 $123, (%eax){1to32}, %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x08,0x10,0x7b] - vrndscalenepbf16 $123, (%eax){1to32}, %zmm2 + vrndscalebf16 $123, (%eax){1to32}, %zmm2 -// CHECK: vrndscalenepbf16 $123, -2048(,%ebp,2), %zmm2 +// CHECK: vrndscalebf16 $123, -2048(,%ebp,2), %zmm2 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vrndscalenepbf16 $123, -2048(,%ebp,2), %zmm2 + vrndscalebf16 $123, -2048(,%ebp,2), %zmm2 -// CHECK: vrndscalenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, 8128(%ecx), %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0x51,0x7f,0x7b] - vrndscalenepbf16 $123, 8128(%ecx), %zmm2 {%k7} {z} + vrndscalebf16 $123, 8128(%ecx), %zmm2 {%k7} {z} -// CHECK: 
vrndscalenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} +// CHECK: vrndscalebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x08,0x52,0x80,0x7b] - vrndscalenepbf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} + vrndscalebf16 $123, -256(%edx){1to32}, %zmm2 {%k7} {z} -// CHECK: vrsqrtpbf16 %xmm3, %xmm2 +// CHECK: vrsqrtbf16 %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xd3] - vrsqrtpbf16 %xmm3, %xmm2 + vrsqrtbf16 %xmm3, %xmm2 -// CHECK: vrsqrtpbf16 %xmm3, %xmm2 {%k7} +// CHECK: vrsqrtbf16 %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4e,0xd3] - vrsqrtpbf16 %xmm3, %xmm2 {%k7} + vrsqrtbf16 %xmm3, %xmm2 {%k7} -// CHECK: vrsqrtpbf16 %xmm3, %xmm2 {%k7} {z} +// CHECK: vrsqrtbf16 %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0xd3] - vrsqrtpbf16 %xmm3, %xmm2 {%k7} {z} + vrsqrtbf16 %xmm3, %xmm2 {%k7} {z} -// CHECK: vrsqrtpbf16 %zmm3, %zmm2 +// CHECK: vrsqrtbf16 %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xd3] - vrsqrtpbf16 %zmm3, %zmm2 + vrsqrtbf16 %zmm3, %zmm2 -// CHECK: vrsqrtpbf16 %zmm3, %zmm2 {%k7} +// CHECK: vrsqrtbf16 %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0xd3] - vrsqrtpbf16 %zmm3, %zmm2 {%k7} + vrsqrtbf16 %zmm3, %zmm2 {%k7} -// CHECK: vrsqrtpbf16 %zmm3, %zmm2 {%k7} {z} +// CHECK: vrsqrtbf16 %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0xd3] - vrsqrtpbf16 %zmm3, %zmm2 {%k7} {z} + vrsqrtbf16 %zmm3, %zmm2 {%k7} {z} -// CHECK: vrsqrtpbf16 %ymm3, %ymm2 +// CHECK: vrsqrtbf16 %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xd3] - vrsqrtpbf16 %ymm3, %ymm2 + vrsqrtbf16 %ymm3, %ymm2 -// CHECK: vrsqrtpbf16 %ymm3, %ymm2 {%k7} +// CHECK: vrsqrtbf16 %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4e,0xd3] - vrsqrtpbf16 %ymm3, %ymm2 {%k7} + vrsqrtbf16 %ymm3, %ymm2 {%k7} -// CHECK: vrsqrtpbf16 %ymm3, %ymm2 {%k7} {z} +// CHECK: vrsqrtbf16 %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: 
[0x62,0xf6,0x7c,0xaf,0x4e,0xd3] - vrsqrtpbf16 %ymm3, %ymm2 {%k7} {z} + vrsqrtbf16 %ymm3, %ymm2 {%k7} {z} -// CHECK: vrsqrtpbf16 268435456(%esp,%esi,8), %xmm2 +// CHECK: vrsqrtbf16 268435456(%esp,%esi,8), %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10] - vrsqrtpbf16 268435456(%esp,%esi,8), %xmm2 + vrsqrtbf16 268435456(%esp,%esi,8), %xmm2 -// CHECK: vrsqrtpbf16 291(%edi,%eax,4), %xmm2 {%k7} +// CHECK: vrsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00] - vrsqrtpbf16 291(%edi,%eax,4), %xmm2 {%k7} + vrsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7} -// CHECK: vrsqrtpbf16 (%eax){1to8}, %xmm2 +// CHECK: vrsqrtbf16 (%eax){1to8}, %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4e,0x10] - vrsqrtpbf16 (%eax){1to8}, %xmm2 + vrsqrtbf16 (%eax){1to8}, %xmm2 -// CHECK: vrsqrtpbf16 -512(,%ebp,2), %xmm2 +// CHECK: vrsqrtbf16 -512(,%ebp,2), %xmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x14,0x6d,0x00,0xfe,0xff,0xff] - vrsqrtpbf16 -512(,%ebp,2), %xmm2 + vrsqrtbf16 -512(,%ebp,2), %xmm2 -// CHECK: vrsqrtpbf16 2032(%ecx), %xmm2 {%k7} {z} +// CHECK: vrsqrtbf16 2032(%ecx), %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0x51,0x7f] - vrsqrtpbf16 2032(%ecx), %xmm2 {%k7} {z} + vrsqrtbf16 2032(%ecx), %xmm2 {%k7} {z} -// CHECK: vrsqrtpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +// CHECK: vrsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4e,0x52,0x80] - vrsqrtpbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} + vrsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -// CHECK: vrsqrtpbf16 268435456(%esp,%esi,8), %ymm2 +// CHECK: vrsqrtbf16 268435456(%esp,%esi,8), %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10] - vrsqrtpbf16 268435456(%esp,%esi,8), %ymm2 + vrsqrtbf16 268435456(%esp,%esi,8), %ymm2 -// CHECK: vrsqrtpbf16 291(%edi,%eax,4), %ymm2 {%k7} +// CHECK: vrsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7} // CHECK: encoding: 
[0x62,0xf6,0x7c,0x2f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00] - vrsqrtpbf16 291(%edi,%eax,4), %ymm2 {%k7} + vrsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7} -// CHECK: vrsqrtpbf16 (%eax){1to16}, %ymm2 +// CHECK: vrsqrtbf16 (%eax){1to16}, %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4e,0x10] - vrsqrtpbf16 (%eax){1to16}, %ymm2 + vrsqrtbf16 (%eax){1to16}, %ymm2 -// CHECK: vrsqrtpbf16 -1024(,%ebp,2), %ymm2 +// CHECK: vrsqrtbf16 -1024(,%ebp,2), %ymm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x14,0x6d,0x00,0xfc,0xff,0xff] - vrsqrtpbf16 -1024(,%ebp,2), %ymm2 + vrsqrtbf16 -1024(,%ebp,2), %ymm2 -// CHECK: vrsqrtpbf16 4064(%ecx), %ymm2 {%k7} {z} +// CHECK: vrsqrtbf16 4064(%ecx), %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4e,0x51,0x7f] - vrsqrtpbf16 4064(%ecx), %ymm2 {%k7} {z} + vrsqrtbf16 4064(%ecx), %ymm2 {%k7} {z} -// CHECK: vrsqrtpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +// CHECK: vrsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xbf,0x4e,0x52,0x80] - vrsqrtpbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} + vrsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -// CHECK: vrsqrtpbf16 268435456(%esp,%esi,8), %zmm2 +// CHECK: vrsqrtbf16 268435456(%esp,%esi,8), %zmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10] - vrsqrtpbf16 268435456(%esp,%esi,8), %zmm2 + vrsqrtbf16 268435456(%esp,%esi,8), %zmm2 -// CHECK: vrsqrtpbf16 291(%edi,%eax,4), %zmm2 {%k7} +// CHECK: vrsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00] - vrsqrtpbf16 291(%edi,%eax,4), %zmm2 {%k7} + vrsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7} -// CHECK: vrsqrtpbf16 (%eax){1to32}, %zmm2 +// CHECK: vrsqrtbf16 (%eax){1to32}, %zmm2 // CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4e,0x10] - vrsqrtpbf16 (%eax){1to32}, %zmm2 + vrsqrtbf16 (%eax){1to32}, %zmm2 -// CHECK: vrsqrtpbf16 -2048(,%ebp,2), %zmm2 +// CHECK: vrsqrtbf16 -2048(,%ebp,2), %zmm2 // CHECK: encoding: 
[0x62,0xf6,0x7c,0x48,0x4e,0x14,0x6d,0x00,0xf8,0xff,0xff] - vrsqrtpbf16 -2048(,%ebp,2), %zmm2 + vrsqrtbf16 -2048(,%ebp,2), %zmm2 -// CHECK: vrsqrtpbf16 8128(%ecx), %zmm2 {%k7} {z} +// CHECK: vrsqrtbf16 8128(%ecx), %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0x51,0x7f] - vrsqrtpbf16 8128(%ecx), %zmm2 {%k7} {z} + vrsqrtbf16 8128(%ecx), %zmm2 {%k7} {z} -// CHECK: vrsqrtpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +// CHECK: vrsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4e,0x52,0x80] - vrsqrtpbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} + vrsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -// CHECK: vscalefpbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vscalefbf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0xd4] - vscalefpbf16 %ymm4, %ymm3, %ymm2 + vscalefbf16 %ymm4, %ymm3, %ymm2 -// CHECK: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0xd4] - vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} + vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0xd4] - vscalefpbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vscalefpbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vscalefbf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0xd4] - vscalefpbf16 %zmm4, %zmm3, %zmm2 + vscalefbf16 %zmm4, %zmm3, %zmm2 -// CHECK: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0xd4] - vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} + vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0xd4] - vscalefpbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vscalefbf16 %zmm4, %zmm3, 
%zmm2 {%k7} {z} -// CHECK: vscalefpbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vscalefbf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0xd4] - vscalefpbf16 %xmm4, %xmm3, %xmm2 + vscalefbf16 %xmm4, %xmm3, %xmm2 -// CHECK: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0xd4] - vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} + vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x2c,0xd4] - vscalefpbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vscalefpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vscalefbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10] - vscalefpbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vscalefbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vscalefpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vscalefbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00] - vscalefpbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vscalefbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vscalefpbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vscalefbf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x2c,0x10] - vscalefpbf16 (%eax){1to32}, %zmm3, %zmm2 + vscalefbf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vscalefpbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vscalefbf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vscalefpbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vscalefbf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vscalefpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vscalefbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0x51,0x7f] - 
vscalefpbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vscalefbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vscalefpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vscalefbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x2c,0x52,0x80] - vscalefpbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vscalefbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vscalefpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vscalefbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10] - vscalefpbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vscalefbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 -// CHECK: vscalefpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vscalefbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00] - vscalefpbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vscalefbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vscalefpbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vscalefbf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x2c,0x10] - vscalefpbf16 (%eax){1to16}, %ymm3, %ymm2 + vscalefbf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vscalefpbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vscalefbf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vscalefpbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vscalefbf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vscalefpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vscalefbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0x51,0x7f] - vscalefpbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vscalefbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vscalefpbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vscalefbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x2c,0x52,0x80] - vscalefpbf16 
-256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vscalefbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vscalefpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vscalefbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10] - vscalefpbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vscalefbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vscalefpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vscalefbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00] - vscalefpbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vscalefbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vscalefpbf16 (%eax){1to8}, %xmm3, %xmm2 +// CHECK: vscalefbf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x2c,0x10] - vscalefpbf16 (%eax){1to8}, %xmm3, %xmm2 + vscalefbf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vscalefpbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vscalefbf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vscalefpbf16 -512(,%ebp,2), %xmm3, %xmm2 + vscalefbf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vscalefpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vscalefbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x2c,0x51,0x7f] - vscalefpbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vscalefbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vscalefpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vscalefbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x2c,0x52,0x80] - vscalefpbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vscalefbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} -// CHECK: vsqrtnepbf16 %xmm3, %xmm2 +// CHECK: vsqrtbf16 %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0xd3] - vsqrtnepbf16 %xmm3, %xmm2 + vsqrtbf16 %xmm3, %xmm2 -// CHECK: vsqrtnepbf16 %xmm3, %xmm2 {%k7} +// 
CHECK: vsqrtbf16 %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x51,0xd3] - vsqrtnepbf16 %xmm3, %xmm2 {%k7} + vsqrtbf16 %xmm3, %xmm2 {%k7} -// CHECK: vsqrtnepbf16 %xmm3, %xmm2 {%k7} {z} +// CHECK: vsqrtbf16 %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0xd3] - vsqrtnepbf16 %xmm3, %xmm2 {%k7} {z} + vsqrtbf16 %xmm3, %xmm2 {%k7} {z} -// CHECK: vsqrtnepbf16 %zmm3, %zmm2 +// CHECK: vsqrtbf16 %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0xd3] - vsqrtnepbf16 %zmm3, %zmm2 + vsqrtbf16 %zmm3, %zmm2 -// CHECK: vsqrtnepbf16 %zmm3, %zmm2 {%k7} +// CHECK: vsqrtbf16 %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0xd3] - vsqrtnepbf16 %zmm3, %zmm2 {%k7} + vsqrtbf16 %zmm3, %zmm2 {%k7} -// CHECK: vsqrtnepbf16 %zmm3, %zmm2 {%k7} {z} +// CHECK: vsqrtbf16 %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0xd3] - vsqrtnepbf16 %zmm3, %zmm2 {%k7} {z} + vsqrtbf16 %zmm3, %zmm2 {%k7} {z} -// CHECK: vsqrtnepbf16 %ymm3, %ymm2 +// CHECK: vsqrtbf16 %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0xd3] - vsqrtnepbf16 %ymm3, %ymm2 + vsqrtbf16 %ymm3, %ymm2 -// CHECK: vsqrtnepbf16 %ymm3, %ymm2 {%k7} +// CHECK: vsqrtbf16 %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0xd3] - vsqrtnepbf16 %ymm3, %ymm2 {%k7} + vsqrtbf16 %ymm3, %ymm2 {%k7} -// CHECK: vsqrtnepbf16 %ymm3, %ymm2 {%k7} {z} +// CHECK: vsqrtbf16 %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0xd3] - vsqrtnepbf16 %ymm3, %ymm2 {%k7} {z} + vsqrtbf16 %ymm3, %ymm2 {%k7} {z} -// CHECK: vsqrtnepbf16 268435456(%esp,%esi,8), %xmm2 +// CHECK: vsqrtbf16 268435456(%esp,%esi,8), %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x94,0xf4,0x00,0x00,0x00,0x10] - vsqrtnepbf16 268435456(%esp,%esi,8), %xmm2 + vsqrtbf16 268435456(%esp,%esi,8), %xmm2 -// CHECK: vsqrtnepbf16 291(%edi,%eax,4), %xmm2 {%k7} +// CHECK: vsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7} // CHECK: encoding: 
[0x62,0xf5,0x7d,0x0f,0x51,0x94,0x87,0x23,0x01,0x00,0x00] - vsqrtnepbf16 291(%edi,%eax,4), %xmm2 {%k7} + vsqrtbf16 291(%edi,%eax,4), %xmm2 {%k7} -// CHECK: vsqrtnepbf16 (%eax){1to8}, %xmm2 +// CHECK: vsqrtbf16 (%eax){1to8}, %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x51,0x10] - vsqrtnepbf16 (%eax){1to8}, %xmm2 + vsqrtbf16 (%eax){1to8}, %xmm2 -// CHECK: vsqrtnepbf16 -512(,%ebp,2), %xmm2 +// CHECK: vsqrtbf16 -512(,%ebp,2), %xmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x14,0x6d,0x00,0xfe,0xff,0xff] - vsqrtnepbf16 -512(,%ebp,2), %xmm2 + vsqrtbf16 -512(,%ebp,2), %xmm2 -// CHECK: vsqrtnepbf16 2032(%ecx), %xmm2 {%k7} {z} +// CHECK: vsqrtbf16 2032(%ecx), %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0x51,0x7f] - vsqrtnepbf16 2032(%ecx), %xmm2 {%k7} {z} + vsqrtbf16 2032(%ecx), %xmm2 {%k7} {z} -// CHECK: vsqrtnepbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} +// CHECK: vsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x51,0x52,0x80] - vsqrtnepbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} + vsqrtbf16 -256(%edx){1to8}, %xmm2 {%k7} {z} -// CHECK: vsqrtnepbf16 268435456(%esp,%esi,8), %ymm2 +// CHECK: vsqrtbf16 268435456(%esp,%esi,8), %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x94,0xf4,0x00,0x00,0x00,0x10] - vsqrtnepbf16 268435456(%esp,%esi,8), %ymm2 + vsqrtbf16 268435456(%esp,%esi,8), %ymm2 -// CHECK: vsqrtnepbf16 291(%edi,%eax,4), %ymm2 {%k7} +// CHECK: vsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0x94,0x87,0x23,0x01,0x00,0x00] - vsqrtnepbf16 291(%edi,%eax,4), %ymm2 {%k7} + vsqrtbf16 291(%edi,%eax,4), %ymm2 {%k7} -// CHECK: vsqrtnepbf16 (%eax){1to16}, %ymm2 +// CHECK: vsqrtbf16 (%eax){1to16}, %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x51,0x10] - vsqrtnepbf16 (%eax){1to16}, %ymm2 + vsqrtbf16 (%eax){1to16}, %ymm2 -// CHECK: vsqrtnepbf16 -1024(,%ebp,2), %ymm2 +// CHECK: vsqrtbf16 -1024(,%ebp,2), %ymm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x14,0x6d,0x00,0xfc,0xff,0xff] 
- vsqrtnepbf16 -1024(,%ebp,2), %ymm2 + vsqrtbf16 -1024(,%ebp,2), %ymm2 -// CHECK: vsqrtnepbf16 4064(%ecx), %ymm2 {%k7} {z} +// CHECK: vsqrtbf16 4064(%ecx), %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0x51,0x7f] - vsqrtnepbf16 4064(%ecx), %ymm2 {%k7} {z} + vsqrtbf16 4064(%ecx), %ymm2 {%k7} {z} -// CHECK: vsqrtnepbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} +// CHECK: vsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x51,0x52,0x80] - vsqrtnepbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} + vsqrtbf16 -256(%edx){1to16}, %ymm2 {%k7} {z} -// CHECK: vsqrtnepbf16 268435456(%esp,%esi,8), %zmm2 +// CHECK: vsqrtbf16 268435456(%esp,%esi,8), %zmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x94,0xf4,0x00,0x00,0x00,0x10] - vsqrtnepbf16 268435456(%esp,%esi,8), %zmm2 + vsqrtbf16 268435456(%esp,%esi,8), %zmm2 -// CHECK: vsqrtnepbf16 291(%edi,%eax,4), %zmm2 {%k7} +// CHECK: vsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0x94,0x87,0x23,0x01,0x00,0x00] - vsqrtnepbf16 291(%edi,%eax,4), %zmm2 {%k7} + vsqrtbf16 291(%edi,%eax,4), %zmm2 {%k7} -// CHECK: vsqrtnepbf16 (%eax){1to32}, %zmm2 +// CHECK: vsqrtbf16 (%eax){1to32}, %zmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x51,0x10] - vsqrtnepbf16 (%eax){1to32}, %zmm2 + vsqrtbf16 (%eax){1to32}, %zmm2 -// CHECK: vsqrtnepbf16 -2048(,%ebp,2), %zmm2 +// CHECK: vsqrtbf16 -2048(,%ebp,2), %zmm2 // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x14,0x6d,0x00,0xf8,0xff,0xff] - vsqrtnepbf16 -2048(,%ebp,2), %zmm2 + vsqrtbf16 -2048(,%ebp,2), %zmm2 -// CHECK: vsqrtnepbf16 8128(%ecx), %zmm2 {%k7} {z} +// CHECK: vsqrtbf16 8128(%ecx), %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0x51,0x7f] - vsqrtnepbf16 8128(%ecx), %zmm2 {%k7} {z} + vsqrtbf16 8128(%ecx), %zmm2 {%k7} {z} -// CHECK: vsqrtnepbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} +// CHECK: vsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x51,0x52,0x80] - vsqrtnepbf16 
-256(%edx){1to32}, %zmm2 {%k7} {z} + vsqrtbf16 -256(%edx){1to32}, %zmm2 {%k7} {z} -// CHECK: vsubnepbf16 %ymm4, %ymm3, %ymm2 +// CHECK: vsubbf16 %ymm4, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0xd4] - vsubnepbf16 %ymm4, %ymm3, %ymm2 + vsubbf16 %ymm4, %ymm3, %ymm2 -// CHECK: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} +// CHECK: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0xd4] - vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} + vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} -// CHECK: vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} +// CHECK: vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0xd4] - vsubnepbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} + vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} {z} -// CHECK: vsubnepbf16 %zmm4, %zmm3, %zmm2 +// CHECK: vsubbf16 %zmm4, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0xd4] - vsubnepbf16 %zmm4, %zmm3, %zmm2 + vsubbf16 %zmm4, %zmm3, %zmm2 -// CHECK: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} +// CHECK: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0xd4] - vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} + vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} -// CHECK: vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} +// CHECK: vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0xd4] - vsubnepbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} + vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} {z} -// CHECK: vsubnepbf16 %xmm4, %xmm3, %xmm2 +// CHECK: vsubbf16 %xmm4, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0xd4] - vsubnepbf16 %xmm4, %xmm3, %xmm2 + vsubbf16 %xmm4, %xmm3, %xmm2 -// CHECK: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} +// CHECK: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0xd4] - vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} + vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} -// CHECK: vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} +// CHECK: vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0xd4] - 
vsubnepbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} + vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} {z} -// CHECK: vsubnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 +// CHECK: vsubbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10] - vsubnepbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 + vsubbf16 268435456(%esp,%esi,8), %zmm3, %zmm2 -// CHECK: vsubnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} +// CHECK: vsubbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00] - vsubnepbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} + vsubbf16 291(%edi,%eax,4), %zmm3, %zmm2 {%k7} -// CHECK: vsubnepbf16 (%eax){1to32}, %zmm3, %zmm2 +// CHECK: vsubbf16 (%eax){1to32}, %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5c,0x10] - vsubnepbf16 (%eax){1to32}, %zmm3, %zmm2 + vsubbf16 (%eax){1to32}, %zmm3, %zmm2 -// CHECK: vsubnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 +// CHECK: vsubbf16 -2048(,%ebp,2), %zmm3, %zmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vsubnepbf16 -2048(,%ebp,2), %zmm3, %zmm2 + vsubbf16 -2048(,%ebp,2), %zmm3, %zmm2 -// CHECK: vsubnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} +// CHECK: vsubbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0x51,0x7f] - vsubnepbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} + vsubbf16 8128(%ecx), %zmm3, %zmm2 {%k7} {z} -// CHECK: vsubnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} +// CHECK: vsubbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5c,0x52,0x80] - vsubnepbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} + vsubbf16 -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z} -// CHECK: vsubnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 +// CHECK: vsubbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10] - vsubnepbf16 268435456(%esp,%esi,8), %ymm3, %ymm2 + vsubbf16 268435456(%esp,%esi,8), 
%ymm3, %ymm2 -// CHECK: vsubnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} +// CHECK: vsubbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00] - vsubnepbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} + vsubbf16 291(%edi,%eax,4), %ymm3, %ymm2 {%k7} -// CHECK: vsubnepbf16 (%eax){1to16}, %ymm3, %ymm2 +// CHECK: vsubbf16 (%eax){1to16}, %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5c,0x10] - vsubnepbf16 (%eax){1to16}, %ymm3, %ymm2 + vsubbf16 (%eax){1to16}, %ymm3, %ymm2 -// CHECK: vsubnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 +// CHECK: vsubbf16 -1024(,%ebp,2), %ymm3, %ymm2 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vsubnepbf16 -1024(,%ebp,2), %ymm3, %ymm2 + vsubbf16 -1024(,%ebp,2), %ymm3, %ymm2 -// CHECK: vsubnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} +// CHECK: vsubbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0x51,0x7f] - vsubnepbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} + vsubbf16 4064(%ecx), %ymm3, %ymm2 {%k7} {z} -// CHECK: vsubnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} +// CHECK: vsubbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5c,0x52,0x80] - vsubnepbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} + vsubbf16 -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z} -// CHECK: vsubnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 +// CHECK: vsubbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10] - vsubnepbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 + vsubbf16 268435456(%esp,%esi,8), %xmm3, %xmm2 -// CHECK: vsubnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} +// CHECK: vsubbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00] - vsubnepbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} + vsubbf16 291(%edi,%eax,4), %xmm3, %xmm2 {%k7} -// CHECK: vsubnepbf16 (%eax){1to8}, %xmm3, %xmm2 +// 
CHECK: vsubbf16 (%eax){1to8}, %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5c,0x10] - vsubnepbf16 (%eax){1to8}, %xmm3, %xmm2 + vsubbf16 (%eax){1to8}, %xmm3, %xmm2 -// CHECK: vsubnepbf16 -512(,%ebp,2), %xmm3, %xmm2 +// CHECK: vsubbf16 -512(,%ebp,2), %xmm3, %xmm2 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vsubnepbf16 -512(,%ebp,2), %xmm3, %xmm2 + vsubbf16 -512(,%ebp,2), %xmm3, %xmm2 -// CHECK: vsubnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} +// CHECK: vsubbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0x51,0x7f] - vsubnepbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} + vsubbf16 2032(%ecx), %xmm3, %xmm2 {%k7} {z} -// CHECK: vsubnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} +// CHECK: vsubbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5c,0x52,0x80] - vsubnepbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} + vsubbf16 -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z} diff --git a/llvm/test/MC/X86/avx10.2-bf16-32-intel.s b/llvm/test/MC/X86/avx10.2-bf16-32-intel.s index 30c2cf45297bc..f19e41d52d4ee 100644 --- a/llvm/test/MC/X86/avx10.2-bf16-32-intel.s +++ b/llvm/test/MC/X86/avx10.2-bf16-32-intel.s @@ -1,208 +1,208 @@ // RUN: llvm-mc -triple i386 -x86-asm-syntax=intel -output-asm-variant=1 --show-encoding %s | FileCheck %s -// CHECK: vaddnepbf16 ymm2, ymm3, ymm4 +// CHECK: vaddbf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0xd4] - vaddnepbf16 ymm2, ymm3, ymm4 + vaddbf16 ymm2, ymm3, ymm4 -// CHECK: vaddnepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vaddbf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0xd4] - vaddnepbf16 ymm2 {k7}, ymm3, ymm4 + vaddbf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vaddbf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0xd4] - vaddnepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vaddbf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vaddnepbf16 zmm2, zmm3, 
zmm4 +// CHECK: vaddbf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0xd4] - vaddnepbf16 zmm2, zmm3, zmm4 + vaddbf16 zmm2, zmm3, zmm4 -// CHECK: vaddnepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vaddbf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x58,0xd4] - vaddnepbf16 zmm2 {k7}, zmm3, zmm4 + vaddbf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vaddbf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0xd4] - vaddnepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vaddbf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vaddnepbf16 xmm2, xmm3, xmm4 +// CHECK: vaddbf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0xd4] - vaddnepbf16 xmm2, xmm3, xmm4 + vaddbf16 xmm2, xmm3, xmm4 -// CHECK: vaddnepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vaddbf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0xd4] - vaddnepbf16 xmm2 {k7}, xmm3, xmm4 + vaddbf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vaddbf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0xd4] - vaddnepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vaddbf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vaddnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vaddbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x94,0xf4,0x00,0x00,0x00,0x10] - vaddnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vaddbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vaddnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vaddbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x58,0x94,0x87,0x23,0x01,0x00,0x00] - vaddnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vaddbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vaddnepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vaddbf16 zmm2, zmm3, word ptr 
[eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x58,0x10] - vaddnepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vaddbf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vaddnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vaddbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x58,0x14,0x6d,0x00,0xf8,0xff,0xff] - vaddnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vaddbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vaddnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vaddbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x58,0x51,0x7f] - vaddnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vaddbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vaddnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vaddbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x58,0x52,0x80] - vaddnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vaddbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vaddnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vaddbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x94,0xf4,0x00,0x00,0x00,0x10] - vaddnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vaddbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vaddnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vaddbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x58,0x94,0x87,0x23,0x01,0x00,0x00] - vaddnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vaddbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vaddnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vaddbf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x58,0x10] - vaddnepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vaddbf16 
ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vaddnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vaddbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x58,0x14,0x6d,0x00,0xfc,0xff,0xff] - vaddnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vaddbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vaddnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vaddbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x58,0x51,0x7f] - vaddnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vaddbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vaddnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vaddbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x58,0x52,0x80] - vaddnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vaddbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vaddnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vaddbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x94,0xf4,0x00,0x00,0x00,0x10] - vaddnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vaddbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vaddnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vaddbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x58,0x94,0x87,0x23,0x01,0x00,0x00] - vaddnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vaddbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vaddnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vaddbf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x58,0x10] - vaddnepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vaddbf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vaddnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vaddbf16 xmm2, xmm3, 
xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x58,0x14,0x6d,0x00,0xfe,0xff,0xff] - vaddnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vaddbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vaddnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vaddbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x58,0x51,0x7f] - vaddnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vaddbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vaddnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vaddbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x58,0x52,0x80] - vaddnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vaddbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vcmppbf16 k5, ymm3, ymm4, 123 +// CHECK: vcmpbf16 k5, ymm3, ymm4, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xec,0x7b] - vcmppbf16 k5, ymm3, ymm4, 123 + vcmpbf16 k5, ymm3, ymm4, 123 -// CHECK: vcmppbf16 k5 {k7}, ymm3, ymm4, 123 +// CHECK: vcmpbf16 k5 {k7}, ymm3, ymm4, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xec,0x7b] - vcmppbf16 k5 {k7}, ymm3, ymm4, 123 + vcmpbf16 k5 {k7}, ymm3, ymm4, 123 -// CHECK: vcmppbf16 k5, xmm3, xmm4, 123 +// CHECK: vcmpbf16 k5, xmm3, xmm4, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xec,0x7b] - vcmppbf16 k5, xmm3, xmm4, 123 + vcmpbf16 k5, xmm3, xmm4, 123 -// CHECK: vcmppbf16 k5 {k7}, xmm3, xmm4, 123 +// CHECK: vcmpbf16 k5 {k7}, xmm3, xmm4, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xec,0x7b] - vcmppbf16 k5 {k7}, xmm3, xmm4, 123 + vcmpbf16 k5 {k7}, xmm3, xmm4, 123 -// CHECK: vcmppbf16 k5, zmm3, zmm4, 123 +// CHECK: vcmpbf16 k5, zmm3, zmm4, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0xec,0x7b] - vcmppbf16 k5, zmm3, zmm4, 123 + vcmpbf16 k5, zmm3, zmm4, 123 -// CHECK: vcmppbf16 k5 {k7}, zmm3, zmm4, 123 +// CHECK: vcmpbf16 k5 {k7}, zmm3, zmm4, 123 // CHECK: encoding: 
[0x62,0xf3,0x67,0x4f,0xc2,0xec,0x7b] - vcmppbf16 k5 {k7}, zmm3, zmm4, 123 + vcmpbf16 k5 {k7}, zmm3, zmm4, 123 -// CHECK: vcmppbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vcmpbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123 + vcmpbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123 + vcmpbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vcmppbf16 k5, zmm3, word ptr [eax]{1to32}, 123 +// CHECK: vcmpbf16 k5, zmm3, word ptr [eax]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x58,0xc2,0x28,0x7b] - vcmppbf16 k5, zmm3, word ptr [eax]{1to32}, 123 + vcmpbf16 k5, zmm3, word ptr [eax]{1to32}, 123 -// CHECK: vcmppbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123 +// CHECK: vcmpbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x48,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vcmppbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123 + vcmpbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123 -// CHECK: vcmppbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123 +// CHECK: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x4f,0xc2,0x69,0x7f,0x7b] - vcmppbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123 + vcmpbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123 -// CHECK: vcmppbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123 +// CHECK: vcmpbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x5f,0xc2,0x6a,0x80,0x7b] - vcmppbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123 + vcmpbf16 k5 {k7}, zmm3, 
word ptr [edx - 256]{1to32}, 123 -// CHECK: vcmppbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vcmpbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123 + vcmpbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123 + vcmpbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vcmppbf16 k5, xmm3, word ptr [eax]{1to8}, 123 +// CHECK: vcmpbf16 k5, xmm3, word ptr [eax]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x18,0xc2,0x28,0x7b] - vcmppbf16 k5, xmm3, word ptr [eax]{1to8}, 123 + vcmpbf16 k5, xmm3, word ptr [eax]{1to8}, 123 -// CHECK: vcmppbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123 +// CHECK: vcmpbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x08,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vcmppbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123 + vcmpbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123 -// CHECK: vcmppbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123 +// CHECK: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x0f,0xc2,0x69,0x7f,0x7b] - vcmppbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123 + vcmpbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123 -// CHECK: vcmppbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123 +// CHECK: vcmpbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x1f,0xc2,0x6a,0x80,0x7b] - vcmppbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123 + vcmpbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123 -// CHECK: vcmppbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 
268435456], 123 +// CHECK: vcmpbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123 + vcmpbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123 +// CHECK: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123 + vcmpbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123 -// CHECK: vcmppbf16 k5, ymm3, word ptr [eax]{1to16}, 123 +// CHECK: vcmpbf16 k5, ymm3, word ptr [eax]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x38,0xc2,0x28,0x7b] - vcmppbf16 k5, ymm3, word ptr [eax]{1to16}, 123 + vcmpbf16 k5, ymm3, word ptr [eax]{1to16}, 123 -// CHECK: vcmppbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123 +// CHECK: vcmpbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x28,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vcmppbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123 + vcmpbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123 -// CHECK: vcmppbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123 +// CHECK: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123 // CHECK: encoding: [0x62,0xf3,0x67,0x2f,0xc2,0x69,0x7f,0x7b] - vcmppbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123 + vcmpbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123 -// CHECK: vcmppbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123 +// CHECK: vcmpbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x67,0x3f,0xc2,0x6a,0x80,0x7b] - vcmppbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123 + vcmpbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123 // CHECK: vcomsbf16 xmm2, xmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x2f,0xd3] @@ -232,2783 +232,2783 @@ // CHECK: encoding: 
[0x62,0xf5,0x7d,0x08,0x2f,0x52,0x80] vcomsbf16 xmm2, word ptr [edx - 256] -// CHECK: vdivnepbf16 ymm2, ymm3, ymm4 +// CHECK: vdivbf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0xd4] - vdivnepbf16 ymm2, ymm3, ymm4 + vdivbf16 ymm2, ymm3, ymm4 -// CHECK: vdivnepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vdivbf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0xd4] - vdivnepbf16 ymm2 {k7}, ymm3, ymm4 + vdivbf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vdivbf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0xd4] - vdivnepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vdivbf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vdivnepbf16 zmm2, zmm3, zmm4 +// CHECK: vdivbf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0xd4] - vdivnepbf16 zmm2, zmm3, zmm4 + vdivbf16 zmm2, zmm3, zmm4 -// CHECK: vdivnepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vdivbf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0xd4] - vdivnepbf16 zmm2 {k7}, zmm3, zmm4 + vdivbf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vdivbf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0xd4] - vdivnepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vdivbf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vdivnepbf16 xmm2, xmm3, xmm4 +// CHECK: vdivbf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0xd4] - vdivnepbf16 xmm2, xmm3, xmm4 + vdivbf16 xmm2, xmm3, xmm4 -// CHECK: vdivnepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vdivbf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0xd4] - vdivnepbf16 xmm2 {k7}, xmm3, xmm4 + vdivbf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vdivbf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0xd4] - vdivnepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vdivbf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vdivnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 
268435456] +// CHECK: vdivbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10] - vdivnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vdivbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vdivnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vdivbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00] - vdivnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vdivbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vdivnepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vdivbf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5e,0x10] - vdivnepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vdivbf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vdivnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vdivbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5e,0x14,0x6d,0x00,0xf8,0xff,0xff] - vdivnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vdivbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vdivnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vdivbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5e,0x51,0x7f] - vdivnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vdivbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vdivnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vdivbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5e,0x52,0x80] - vdivnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vdivbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vdivnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vdivbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: 
[0x62,0xf5,0x65,0x28,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10] - vdivnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vdivbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vdivnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vdivbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00] - vdivnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vdivbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vdivnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vdivbf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5e,0x10] - vdivnepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vdivbf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vdivnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vdivbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5e,0x14,0x6d,0x00,0xfc,0xff,0xff] - vdivnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vdivbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vdivnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vdivbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5e,0x51,0x7f] - vdivnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vdivbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vdivnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vdivbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5e,0x52,0x80] - vdivnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vdivbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vdivnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vdivbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10] - vdivnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + 
vdivbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vdivnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vdivbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00] - vdivnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vdivbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vdivnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vdivbf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5e,0x10] - vdivnepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vdivbf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vdivnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vdivbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5e,0x14,0x6d,0x00,0xfe,0xff,0xff] - vdivnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vdivbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vdivnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vdivbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5e,0x51,0x7f] - vdivnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vdivbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vdivnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vdivbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5e,0x52,0x80] - vdivnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vdivbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfmadd132nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfmadd132bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0xd4] - vfmadd132nepbf16 ymm2, ymm3, ymm4 + vfmadd132bf16 ymm2, ymm3, ymm4 -// CHECK: vfmadd132nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfmadd132bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0xd4] - vfmadd132nepbf16 ymm2 {k7}, ymm3, ymm4 + vfmadd132bf16 ymm2 {k7}, 
ymm3, ymm4 -// CHECK: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0xd4] - vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfmadd132nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfmadd132bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0xd4] - vfmadd132nepbf16 zmm2, zmm3, zmm4 + vfmadd132bf16 zmm2, zmm3, zmm4 -// CHECK: vfmadd132nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfmadd132bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0xd4] - vfmadd132nepbf16 zmm2 {k7}, zmm3, zmm4 + vfmadd132bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0xd4] - vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfmadd132nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfmadd132bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0xd4] - vfmadd132nepbf16 xmm2, xmm3, xmm4 + vfmadd132bf16 xmm2, xmm3, xmm4 -// CHECK: vfmadd132nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfmadd132bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0xd4] - vfmadd132nepbf16 xmm2 {k7}, xmm3, xmm4 + vfmadd132bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0xd4] - vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: 
vfmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x98,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x98,0x10] - vfmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x98,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x98,0x51,0x7f] - vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x98,0x52,0x80] - vfmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: 
vfmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x98,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x98,0x10] - vfmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x98,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x98,0x51,0x7f] - vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x98,0x52,0x80] - vfmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: 
vfmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x98,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x98,0x10] - vfmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x98,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x98,0x51,0x7f] - vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x98,0x52,0x80] - vfmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfmadd213nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfmadd213bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0xd4] - vfmadd213nepbf16 ymm2, ymm3, ymm4 + vfmadd213bf16 ymm2, ymm3, ymm4 -// CHECK: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfmadd213bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0xd4] - vfmadd213nepbf16 ymm2 {k7}, ymm3, 
ymm4 + vfmadd213bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0xd4] - vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfmadd213nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfmadd213bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0xd4] - vfmadd213nepbf16 zmm2, zmm3, zmm4 + vfmadd213bf16 zmm2, zmm3, zmm4 -// CHECK: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfmadd213bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0xd4] - vfmadd213nepbf16 zmm2 {k7}, zmm3, zmm4 + vfmadd213bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0xd4] - vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfmadd213nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfmadd213bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0xd4] - vfmadd213nepbf16 xmm2, xmm3, xmm4 + vfmadd213bf16 xmm2, xmm3, xmm4 -// CHECK: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfmadd213bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0xd4] - vfmadd213nepbf16 xmm2 {k7}, xmm3, xmm4 + vfmadd213bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0xd4] - vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi 
+ 268435456] -// CHECK: vfmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xa8,0x10] - vfmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xa8,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xa8,0x51,0x7f] - vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xa8,0x52,0x80] - vfmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 
268435456] -// CHECK: vfmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xa8,0x10] - vfmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xa8,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xa8,0x51,0x7f] - vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xa8,0x52,0x80] - vfmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 
268435456] -// CHECK: vfmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xa8,0x10] - vfmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xa8,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xa8,0x51,0x7f] - vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xa8,0x52,0x80] - vfmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfmadd231nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfmadd231bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0xd4] - vfmadd231nepbf16 ymm2, ymm3, ymm4 + vfmadd231bf16 ymm2, ymm3, ymm4 -// CHECK: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfmadd231bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0xd4] - 
vfmadd231nepbf16 ymm2 {k7}, ymm3, ymm4 + vfmadd231bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0xd4] - vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfmadd231nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfmadd231bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0xd4] - vfmadd231nepbf16 zmm2, zmm3, zmm4 + vfmadd231bf16 zmm2, zmm3, zmm4 -// CHECK: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfmadd231bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0xd4] - vfmadd231nepbf16 zmm2 {k7}, zmm3, zmm4 + vfmadd231bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0xd4] - vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfmadd231nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfmadd231bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0xd4] - vfmadd231nepbf16 xmm2, xmm3, xmm4 + vfmadd231bf16 xmm2, xmm3, xmm4 -// CHECK: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfmadd231bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0xd4] - vfmadd231nepbf16 xmm2 {k7}, xmm3, xmm4 + vfmadd231bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xb8,0xd4] - vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfmadd231bf16 
zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xb8,0x10] - vfmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xb8,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xb8,0x51,0x7f] - vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xb8,0x52,0x80] - vfmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfmadd231bf16 ymm2, 
ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xb8,0x10] - vfmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xb8,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xb8,0x51,0x7f] - vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xb8,0x52,0x80] - vfmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfmadd231bf16 xmm2, xmm3, 
xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xb8,0x10] - vfmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xb8,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xb8,0x51,0x7f] - vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xb8,0x52,0x80] - vfmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfmsub132nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfmsub132bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0xd4] - vfmsub132nepbf16 ymm2, ymm3, ymm4 + vfmsub132bf16 ymm2, ymm3, ymm4 -// CHECK: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfmsub132bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: 
[0x62,0xf6,0x64,0x2f,0x9a,0xd4] - vfmsub132nepbf16 ymm2 {k7}, ymm3, ymm4 + vfmsub132bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0xd4] - vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfmsub132nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfmsub132bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0xd4] - vfmsub132nepbf16 zmm2, zmm3, zmm4 + vfmsub132bf16 zmm2, zmm3, zmm4 -// CHECK: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfmsub132bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0xd4] - vfmsub132nepbf16 zmm2 {k7}, zmm3, zmm4 + vfmsub132bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0xd4] - vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfmsub132nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfmsub132bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0xd4] - vfmsub132nepbf16 xmm2, xmm3, xmm4 + vfmsub132bf16 xmm2, xmm3, xmm4 -// CHECK: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfmsub132bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0xd4] - vfmsub132nepbf16 xmm2 {k7}, xmm3, xmm4 + vfmsub132bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0xd4] - vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 
8*esi + 268435456] + vfmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9a,0x10] - vfmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9a,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9a,0x51,0x7f] - vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9a,0x52,0x80] - vfmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi 
+ 268435456] + vfmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9a,0x10] - vfmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9a,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9a,0x51,0x7f] - vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9a,0x52,0x80] - vfmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 
268435456] + vfmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9a,0x10] - vfmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9a,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9a,0x51,0x7f] - vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9a,0x52,0x80] - vfmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfmsub213nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfmsub213bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0xd4] - vfmsub213nepbf16 ymm2, ymm3, ymm4 + vfmsub213bf16 ymm2, ymm3, ymm4 -// CHECK: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfmsub213bf16 ymm2 {k7}, ymm3, ymm4 
// CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0xd4] - vfmsub213nepbf16 ymm2 {k7}, ymm3, ymm4 + vfmsub213bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0xd4] - vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfmsub213nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfmsub213bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0xd4] - vfmsub213nepbf16 zmm2, zmm3, zmm4 + vfmsub213bf16 zmm2, zmm3, zmm4 -// CHECK: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfmsub213bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0xd4] - vfmsub213nepbf16 zmm2 {k7}, zmm3, zmm4 + vfmsub213bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0xd4] - vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfmsub213nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfmsub213bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0xd4] - vfmsub213nepbf16 xmm2, xmm3, xmm4 + vfmsub213bf16 xmm2, xmm3, xmm4 -// CHECK: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfmsub213bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0xd4] - vfmsub213nepbf16 xmm2 {k7}, xmm3, xmm4 + vfmsub213bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0xd4] - vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 zmm2, zmm3, 
zmmword ptr [esp + 8*esi + 268435456] + vfmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xaa,0x10] - vfmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xaa,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xaa,0x51,0x7f] - vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xaa,0x52,0x80] - vfmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 ymm2, ymm3, 
ymmword ptr [esp + 8*esi + 268435456] + vfmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xaa,0x10] - vfmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xaa,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xaa,0x51,0x7f] - vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xaa,0x52,0x80] - vfmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 xmm2, xmm3, 
xmmword ptr [esp + 8*esi + 268435456] + vfmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xaa,0x10] - vfmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xaa,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xaa,0x51,0x7f] - vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xaa,0x52,0x80] - vfmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfmsub231nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfmsub231bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0xd4] - vfmsub231nepbf16 ymm2, ymm3, ymm4 + vfmsub231bf16 ymm2, ymm3, ymm4 -// CHECK: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: 
vfmsub231bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0xd4] - vfmsub231nepbf16 ymm2 {k7}, ymm3, ymm4 + vfmsub231bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0xd4] - vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfmsub231nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfmsub231bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0xd4] - vfmsub231nepbf16 zmm2, zmm3, zmm4 + vfmsub231bf16 zmm2, zmm3, zmm4 -// CHECK: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfmsub231bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xba,0xd4] - vfmsub231nepbf16 zmm2 {k7}, zmm3, zmm4 + vfmsub231bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0xd4] - vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfmsub231nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfmsub231bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0xd4] - vfmsub231nepbf16 xmm2, xmm3, xmm4 + vfmsub231bf16 xmm2, xmm3, xmm4 -// CHECK: vfmsub231nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfmsub231bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0xd4] - vfmsub231nepbf16 xmm2 {k7}, xmm3, xmm4 + vfmsub231bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0xd4] - vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: 
[0x62,0xf6,0x64,0x48,0xba,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xba,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xba,0x10] - vfmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xba,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xba,0x51,0x7f] - vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xba,0x52,0x80] - vfmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: 
[0x62,0xf6,0x64,0x28,0xba,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xba,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xba,0x10] - vfmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xba,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xba,0x51,0x7f] - vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xba,0x52,0x80] - vfmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: 
[0x62,0xf6,0x64,0x08,0xba,0x94,0xf4,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xba,0x94,0x87,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xba,0x10] - vfmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xba,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xba,0x51,0x7f] - vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xba,0x52,0x80] - vfmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfnmadd132nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfnmadd132bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0xd4] - vfnmadd132nepbf16 ymm2, ymm3, ymm4 + 
vfnmadd132bf16 ymm2, ymm3, ymm4 -// CHECK: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfnmadd132bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0xd4] - vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymm4 + vfnmadd132bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0xd4] - vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfnmadd132nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfnmadd132bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0xd4] - vfnmadd132nepbf16 zmm2, zmm3, zmm4 + vfnmadd132bf16 zmm2, zmm3, zmm4 -// CHECK: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfnmadd132bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0xd4] - vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmm4 + vfnmadd132bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0xd4] - vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfnmadd132nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfnmadd132bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0xd4] - vfnmadd132nepbf16 xmm2, xmm3, xmm4 + vfnmadd132bf16 xmm2, xmm3, xmm4 -// CHECK: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfnmadd132bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0xd4] - vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmm4 + vfnmadd132bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0xd4] - vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: 
vfnmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfnmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfnmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfnmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9c,0x10] - vfnmadd132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfnmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfnmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9c,0x51,0x7f] - vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9c,0x52,0x80] - vfnmadd132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfnmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 
268435456] +// CHECK: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfnmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfnmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfnmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9c,0x10] - vfnmadd132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfnmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfnmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9c,0x51,0x7f] - vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9c,0x52,0x80] - vfnmadd132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfnmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfnmadd132nepbf16 xmm2, xmm3, xmmword 
ptr [esp + 8*esi + 268435456] +// CHECK: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfnmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfnmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfnmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9c,0x10] - vfnmadd132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfnmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfnmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9c,0x51,0x7f] - vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9c,0x52,0x80] - vfnmadd132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfnmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfnmadd213nepbf16 ymm2, ymm3, 
ymm4 +// CHECK: vfnmadd213bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0xd4] - vfnmadd213nepbf16 ymm2, ymm3, ymm4 + vfnmadd213bf16 ymm2, ymm3, ymm4 -// CHECK: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfnmadd213bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0xd4] - vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymm4 + vfnmadd213bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0xd4] - vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfnmadd213nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfnmadd213bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0xd4] - vfnmadd213nepbf16 zmm2, zmm3, zmm4 + vfnmadd213bf16 zmm2, zmm3, zmm4 -// CHECK: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfnmadd213bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0xd4] - vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmm4 + vfnmadd213bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0xd4] - vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfnmadd213nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfnmadd213bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0xd4] - vfnmadd213nepbf16 xmm2, xmm3, xmm4 + vfnmadd213bf16 xmm2, xmm3, xmm4 -// CHECK: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfnmadd213bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0xd4] - vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmm4 + vfnmadd213bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0xd4] - vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + 
vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfnmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xac,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfnmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfnmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xac,0x10] - vfnmadd213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfnmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xac,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfnmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xac,0x51,0x7f] - vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xac,0x52,0x80] - vfnmadd213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + 
vfnmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfnmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xac,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfnmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfnmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xac,0x10] - vfnmadd213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfnmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xac,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfnmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xac,0x51,0x7f] - vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xac,0x52,0x80] - vfnmadd213nepbf16 ymm2 {k7} {z}, ymm3, word ptr 
[edx - 256]{1to16} + vfnmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfnmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xac,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfnmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfnmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xac,0x10] - vfnmadd213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfnmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xac,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfnmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xac,0x51,0x7f] - vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xac,0x52,0x80] - vfnmadd213nepbf16 xmm2 {k7} {z}, xmm3, 
word ptr [edx - 256]{1to8} + vfnmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfnmadd231nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfnmadd231bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0xd4] - vfnmadd231nepbf16 ymm2, ymm3, ymm4 + vfnmadd231bf16 ymm2, ymm3, ymm4 -// CHECK: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfnmadd231bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0xd4] - vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymm4 + vfnmadd231bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0xd4] - vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfnmadd231nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfnmadd231bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0xd4] - vfnmadd231nepbf16 zmm2, zmm3, zmm4 + vfnmadd231bf16 zmm2, zmm3, zmm4 -// CHECK: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfnmadd231bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0xd4] - vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmm4 + vfnmadd231bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0xd4] - vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfnmadd231nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfnmadd231bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0xd4] - vfnmadd231nepbf16 xmm2, xmm3, xmm4 + vfnmadd231bf16 xmm2, xmm3, xmm4 -// CHECK: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfnmadd231bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0xd4] - vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmm4 + vfnmadd231bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: 
vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0xd4] - vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfnmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfnmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfnmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbc,0x10] - vfnmadd231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfnmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbc,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfnmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbc,0x51,0x7f] - vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 
256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbc,0x52,0x80] - vfnmadd231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfnmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfnmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfnmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfnmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbc,0x10] - vfnmadd231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfnmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbc,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfnmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbc,0x51,0x7f] - vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfnmadd231bf16 ymm2 {k7} {z}, 
ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbc,0x52,0x80] - vfnmadd231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfnmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfnmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfnmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfnmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbc,0x10] - vfnmadd231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfnmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbc,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfnmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbc,0x51,0x7f] - vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfnmadd231bf16 xmm2 
{k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbc,0x52,0x80] - vfnmadd231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfnmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfnmsub132nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfnmsub132bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0xd4] - vfnmsub132nepbf16 ymm2, ymm3, ymm4 + vfnmsub132bf16 ymm2, ymm3, ymm4 -// CHECK: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfnmsub132bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9e,0xd4] - vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymm4 + vfnmsub132bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0xd4] - vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfnmsub132nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfnmsub132bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0xd4] - vfnmsub132nepbf16 zmm2, zmm3, zmm4 + vfnmsub132bf16 zmm2, zmm3, zmm4 -// CHECK: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfnmsub132bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0xd4] - vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmm4 + vfnmsub132bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0xd4] - vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfnmsub132nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfnmsub132bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0xd4] - vfnmsub132nepbf16 xmm2, xmm3, xmm4 + vfnmsub132bf16 xmm2, xmm3, xmm4 -// CHECK: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfnmsub132bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0xd4] - vfnmsub132nepbf16 
xmm2 {k7}, xmm3, xmm4 + vfnmsub132bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0xd4] - vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfnmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfnmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfnmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x9e,0x10] - vfnmsub132nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfnmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x9e,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub132nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfnmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x9e,0x51,0x7f] - vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: 
vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x9e,0x52,0x80] - vfnmsub132nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfnmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfnmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfnmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfnmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x9e,0x10] - vfnmsub132nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfnmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x9e,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub132nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfnmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x9e,0x51,0x7f] - vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 
4064] -// CHECK: vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x9e,0x52,0x80] - vfnmsub132nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfnmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfnmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfnmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfnmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x9e,0x10] - vfnmsub132nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfnmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x9e,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub132nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfnmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x9e,0x51,0x7f] - vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword 
ptr [ecx + 2032] -// CHECK: vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x9e,0x52,0x80] - vfnmsub132nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfnmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfnmsub213nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfnmsub213bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0xd4] - vfnmsub213nepbf16 ymm2, ymm3, ymm4 + vfnmsub213bf16 ymm2, ymm3, ymm4 -// CHECK: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfnmsub213bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0xd4] - vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymm4 + vfnmsub213bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0xd4] - vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfnmsub213nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfnmsub213bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0xd4] - vfnmsub213nepbf16 zmm2, zmm3, zmm4 + vfnmsub213bf16 zmm2, zmm3, zmm4 -// CHECK: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfnmsub213bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0xd4] - vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmm4 + vfnmsub213bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0xd4] - vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfnmsub213nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfnmsub213bf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0xd4] - vfnmsub213nepbf16 xmm2, xmm3, xmm4 + vfnmsub213bf16 xmm2, xmm3, xmm4 -// CHECK: vfnmsub213nepbf16 xmm2 {k7}, xmm3, 
xmm4 +// CHECK: vfnmsub213bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0xd4] - vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmm4 + vfnmsub213bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xae,0xd4] - vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfnmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xae,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfnmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfnmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xae,0x10] - vfnmsub213nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfnmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xae,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub213nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfnmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xae,0x51,0x7f] - vfnmsub213nepbf16 
zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xae,0x52,0x80] - vfnmsub213nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfnmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfnmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xae,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfnmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfnmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xae,0x10] - vfnmsub213nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfnmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xae,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub213nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfnmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xae,0x51,0x7f] - 
vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xae,0x52,0x80] - vfnmsub213nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfnmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfnmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xae,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfnmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfnmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xae,0x10] - vfnmsub213nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfnmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xae,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub213nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfnmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: 
[0x62,0xf6,0x64,0x8f,0xae,0x51,0x7f] - vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xae,0x52,0x80] - vfnmsub213nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfnmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfnmsub231nepbf16 ymm2, ymm3, ymm4 +// CHECK: vfnmsub231bf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0xd4] - vfnmsub231nepbf16 ymm2, ymm3, ymm4 + vfnmsub231bf16 ymm2, ymm3, ymm4 -// CHECK: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vfnmsub231bf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0xd4] - vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymm4 + vfnmsub231bf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbe,0xd4] - vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vfnmsub231nepbf16 zmm2, zmm3, zmm4 +// CHECK: vfnmsub231bf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0xd4] - vfnmsub231nepbf16 zmm2, zmm3, zmm4 + vfnmsub231bf16 zmm2, zmm3, zmm4 -// CHECK: vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vfnmsub231bf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0xd4] - vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmm4 + vfnmsub231bf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbe,0xd4] - vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vfnmsub231nepbf16 xmm2, xmm3, xmm4 +// CHECK: vfnmsub231bf16 xmm2, xmm3, xmm4 // CHECK: encoding: 
[0x62,0xf6,0x64,0x08,0xbe,0xd4] - vfnmsub231nepbf16 xmm2, xmm3, xmm4 + vfnmsub231bf16 xmm2, xmm3, xmm4 -// CHECK: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vfnmsub231bf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0xd4] - vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmm4 + vfnmsub231bf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0xd4] - vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vfnmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vfnmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vfnmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0xbe,0x10] - vfnmsub231nepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vfnmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0xbe,0x14,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub231nepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vfnmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] 
+// CHECK: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0xbe,0x51,0x7f] - vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0xbe,0x52,0x80] - vfnmsub231nepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vfnmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vfnmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vfnmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vfnmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0xbe,0x10] - vfnmsub231nepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vfnmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0xbe,0x14,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub231nepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vfnmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword 
ptr [ecx + 4064] +// CHECK: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0xbe,0x51,0x7f] - vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0xbe,0x52,0x80] - vfnmsub231nepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vfnmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vfnmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vfnmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vfnmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vfnmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vfnmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0xbe,0x10] - vfnmsub231nepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vfnmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0xbe,0x14,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub231nepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vfnmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vfnmsub231nepbf16 xmm2 {k7} {z}, 
xmm3, xmmword ptr [ecx + 2032] +// CHECK: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0xbe,0x51,0x7f] - vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0xbe,0x52,0x80] - vfnmsub231nepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vfnmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vfpclasspbf16 k5, zmm3, 123 +// CHECK: vfpclassbf16 k5, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0xeb,0x7b] - vfpclasspbf16 k5, zmm3, 123 + vfpclassbf16 k5, zmm3, 123 -// CHECK: vfpclasspbf16 k5 {k7}, zmm3, 123 +// CHECK: vfpclassbf16 k5 {k7}, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0xeb,0x7b] - vfpclasspbf16 k5 {k7}, zmm3, 123 + vfpclassbf16 k5 {k7}, zmm3, 123 -// CHECK: vfpclasspbf16 k5, ymm3, 123 +// CHECK: vfpclassbf16 k5, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0xeb,0x7b] - vfpclasspbf16 k5, ymm3, 123 + vfpclassbf16 k5, ymm3, 123 -// CHECK: vfpclasspbf16 k5 {k7}, ymm3, 123 +// CHECK: vfpclassbf16 k5 {k7}, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0xeb,0x7b] - vfpclasspbf16 k5 {k7}, ymm3, 123 + vfpclassbf16 k5 {k7}, ymm3, 123 -// CHECK: vfpclasspbf16 k5, xmm3, 123 +// CHECK: vfpclassbf16 k5, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xeb,0x7b] - vfpclasspbf16 k5, xmm3, 123 + vfpclassbf16 k5, xmm3, 123 -// CHECK: vfpclasspbf16 k5 {k7}, xmm3, 123 +// CHECK: vfpclassbf16 k5 {k7}, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0xeb,0x7b] - vfpclasspbf16 k5 {k7}, xmm3, 123 + vfpclassbf16 k5 {k7}, xmm3, 123 -// CHECK: vfpclasspbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vfpclassbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123 // 
CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b] - vfpclasspbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123 + vfpclassbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0xac,0x87,0x23,0x01,0x00,0x00,0x7b] - vfpclasspbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123 + vfpclassbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vfpclasspbf16 k5, word ptr [eax]{1to8}, 123 +// CHECK: vfpclassbf16 k5, word ptr [eax]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x28,0x7b] - vfpclasspbf16 k5, word ptr [eax]{1to8}, 123 + vfpclassbf16 k5, word ptr [eax]{1to8}, 123 -// CHECK: vfpclasspbf16 k5, xmmword ptr [2*ebp - 512], 123 +// CHECK: vfpclassbf16 k5, xmmword ptr [2*ebp - 512], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vfpclasspbf16 k5, xmmword ptr [2*ebp - 512], 123 + vfpclassbf16 k5, xmmword ptr [2*ebp - 512], 123 -// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123 +// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123 + vfpclassbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123 -// CHECK: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123 +// CHECK: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123 + vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123 -// CHECK: vfpclasspbf16 k5, word ptr [eax]{1to16}, 123 +// CHECK: vfpclassbf16 k5, word ptr [eax]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x28,0x7b] - vfpclasspbf16 k5, word ptr [eax]{1to16}, 123 + vfpclassbf16 k5, word ptr [eax]{1to16}, 123 -// CHECK: vfpclasspbf16 
k5, ymmword ptr [2*ebp - 1024], 123 +// CHECK: vfpclassbf16 k5, ymmword ptr [2*ebp - 1024], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vfpclasspbf16 k5, ymmword ptr [2*ebp - 1024], 123 + vfpclassbf16 k5, ymmword ptr [2*ebp - 1024], 123 -// CHECK: vfpclasspbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123 +// CHECK: vfpclassbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123 + vfpclassbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123 -// CHECK: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123 +// CHECK: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123 + vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123 -// CHECK: vfpclasspbf16 k5, word ptr [eax]{1to32}, 123 +// CHECK: vfpclassbf16 k5, word ptr [eax]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x28,0x7b] - vfpclasspbf16 k5, word ptr [eax]{1to32}, 123 + vfpclassbf16 k5, word ptr [eax]{1to32}, 123 -// CHECK: vfpclasspbf16 k5, zmmword ptr [2*ebp - 2048], 123 +// CHECK: vfpclassbf16 k5, zmmword ptr [2*ebp - 2048], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vfpclasspbf16 k5, zmmword ptr [2*ebp - 2048], 123 + vfpclassbf16 k5, zmmword ptr [2*ebp - 2048], 123 -// CHECK: vfpclasspbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123 +// CHECK: vfpclassbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123 + vfpclassbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123 -// CHECK: vfpclasspbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123 +// CHECK: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 k5 {k7}, word ptr [edx - 
256]{1to32}, 123 + vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123 -// CHECK: vgetexppbf16 xmm2, xmm3 +// CHECK: vgetexpbf16 xmm2, xmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0xd3] - vgetexppbf16 xmm2, xmm3 + vgetexpbf16 xmm2, xmm3 -// CHECK: vgetexppbf16 xmm2 {k7}, xmm3 +// CHECK: vgetexpbf16 xmm2 {k7}, xmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0xd3] - vgetexppbf16 xmm2 {k7}, xmm3 + vgetexpbf16 xmm2 {k7}, xmm3 -// CHECK: vgetexppbf16 xmm2 {k7} {z}, xmm3 +// CHECK: vgetexpbf16 xmm2 {k7} {z}, xmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0xd3] - vgetexppbf16 xmm2 {k7} {z}, xmm3 + vgetexpbf16 xmm2 {k7} {z}, xmm3 -// CHECK: vgetexppbf16 zmm2, zmm3 +// CHECK: vgetexpbf16 zmm2, zmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0xd3] - vgetexppbf16 zmm2, zmm3 + vgetexpbf16 zmm2, zmm3 -// CHECK: vgetexppbf16 zmm2 {k7}, zmm3 +// CHECK: vgetexpbf16 zmm2 {k7}, zmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0xd3] - vgetexppbf16 zmm2 {k7}, zmm3 + vgetexpbf16 zmm2 {k7}, zmm3 -// CHECK: vgetexppbf16 zmm2 {k7} {z}, zmm3 +// CHECK: vgetexpbf16 zmm2 {k7} {z}, zmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0xd3] - vgetexppbf16 zmm2 {k7} {z}, zmm3 + vgetexpbf16 zmm2 {k7} {z}, zmm3 -// CHECK: vgetexppbf16 ymm2, ymm3 +// CHECK: vgetexpbf16 ymm2, ymm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0xd3] - vgetexppbf16 ymm2, ymm3 + vgetexpbf16 ymm2, ymm3 -// CHECK: vgetexppbf16 ymm2 {k7}, ymm3 +// CHECK: vgetexpbf16 ymm2 {k7}, ymm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0xd3] - vgetexppbf16 ymm2 {k7}, ymm3 + vgetexpbf16 ymm2 {k7}, ymm3 -// CHECK: vgetexppbf16 ymm2 {k7} {z}, ymm3 +// CHECK: vgetexpbf16 ymm2 {k7} {z}, ymm3 // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0xd3] - vgetexppbf16 ymm2 {k7} {z}, ymm3 + vgetexpbf16 ymm2 {k7} {z}, ymm3 -// CHECK: vgetexppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vgetexpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: 
[0x62,0xf5,0x7d,0x08,0x42,0x94,0xf4,0x00,0x00,0x00,0x10] - vgetexppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] + vgetexpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vgetexppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +// CHECK: vgetexpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x42,0x94,0x87,0x23,0x01,0x00,0x00] - vgetexppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] + vgetexpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] -// CHECK: vgetexppbf16 xmm2, word ptr [eax]{1to8} +// CHECK: vgetexpbf16 xmm2, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x42,0x10] - vgetexppbf16 xmm2, word ptr [eax]{1to8} + vgetexpbf16 xmm2, word ptr [eax]{1to8} -// CHECK: vgetexppbf16 xmm2, xmmword ptr [2*ebp - 512] +// CHECK: vgetexpbf16 xmm2, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x42,0x14,0x6d,0x00,0xfe,0xff,0xff] - vgetexppbf16 xmm2, xmmword ptr [2*ebp - 512] + vgetexpbf16 xmm2, xmmword ptr [2*ebp - 512] -// CHECK: vgetexppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] +// CHECK: vgetexpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x42,0x51,0x7f] - vgetexppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] + vgetexpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] -// CHECK: vgetexppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +// CHECK: vgetexpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x42,0x52,0x80] - vgetexppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} + vgetexpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} -// CHECK: vgetexppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vgetexpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x94,0xf4,0x00,0x00,0x00,0x10] - vgetexppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] + vgetexpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vgetexppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax 
+ 291] +// CHECK: vgetexpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x42,0x94,0x87,0x23,0x01,0x00,0x00] - vgetexppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] + vgetexpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] -// CHECK: vgetexppbf16 ymm2, word ptr [eax]{1to16} +// CHECK: vgetexpbf16 ymm2, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x42,0x10] - vgetexppbf16 ymm2, word ptr [eax]{1to16} + vgetexpbf16 ymm2, word ptr [eax]{1to16} -// CHECK: vgetexppbf16 ymm2, ymmword ptr [2*ebp - 1024] +// CHECK: vgetexpbf16 ymm2, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x42,0x14,0x6d,0x00,0xfc,0xff,0xff] - vgetexppbf16 ymm2, ymmword ptr [2*ebp - 1024] + vgetexpbf16 ymm2, ymmword ptr [2*ebp - 1024] -// CHECK: vgetexppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +// CHECK: vgetexpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x42,0x51,0x7f] - vgetexppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] + vgetexpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] -// CHECK: vgetexppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} +// CHECK: vgetexpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x42,0x52,0x80] - vgetexppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} + vgetexpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} -// CHECK: vgetexppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vgetexpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x94,0xf4,0x00,0x00,0x00,0x10] - vgetexppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] + vgetexpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vgetexppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +// CHECK: vgetexpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x42,0x94,0x87,0x23,0x01,0x00,0x00] - vgetexppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] + vgetexpbf16 
zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] -// CHECK: vgetexppbf16 zmm2, word ptr [eax]{1to32} +// CHECK: vgetexpbf16 zmm2, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x42,0x10] - vgetexppbf16 zmm2, word ptr [eax]{1to32} + vgetexpbf16 zmm2, word ptr [eax]{1to32} -// CHECK: vgetexppbf16 zmm2, zmmword ptr [2*ebp - 2048] +// CHECK: vgetexpbf16 zmm2, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x42,0x14,0x6d,0x00,0xf8,0xff,0xff] - vgetexppbf16 zmm2, zmmword ptr [2*ebp - 2048] + vgetexpbf16 zmm2, zmmword ptr [2*ebp - 2048] -// CHECK: vgetexppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +// CHECK: vgetexpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x42,0x51,0x7f] - vgetexppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] + vgetexpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] -// CHECK: vgetexppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +// CHECK: vgetexpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x42,0x52,0x80] - vgetexppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} + vgetexpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} -// CHECK: vgetmantpbf16 zmm2, zmm3, 123 +// CHECK: vgetmantbf16 zmm2, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0xd3,0x7b] - vgetmantpbf16 zmm2, zmm3, 123 + vgetmantbf16 zmm2, zmm3, 123 -// CHECK: vgetmantpbf16 zmm2 {k7}, zmm3, 123 +// CHECK: vgetmantbf16 zmm2 {k7}, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x26,0xd3,0x7b] - vgetmantpbf16 zmm2 {k7}, zmm3, 123 + vgetmantbf16 zmm2 {k7}, zmm3, 123 -// CHECK: vgetmantpbf16 zmm2 {k7} {z}, zmm3, 123 +// CHECK: vgetmantbf16 zmm2 {k7} {z}, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0xd3,0x7b] - vgetmantpbf16 zmm2 {k7} {z}, zmm3, 123 + vgetmantbf16 zmm2 {k7} {z}, zmm3, 123 -// CHECK: vgetmantpbf16 ymm2, ymm3, 123 +// CHECK: vgetmantbf16 ymm2, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0xd3,0x7b] - vgetmantpbf16 ymm2, ymm3, 123 + 
vgetmantbf16 ymm2, ymm3, 123 -// CHECK: vgetmantpbf16 ymm2 {k7}, ymm3, 123 +// CHECK: vgetmantbf16 ymm2 {k7}, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x26,0xd3,0x7b] - vgetmantpbf16 ymm2 {k7}, ymm3, 123 + vgetmantbf16 ymm2 {k7}, ymm3, 123 -// CHECK: vgetmantpbf16 ymm2 {k7} {z}, ymm3, 123 +// CHECK: vgetmantbf16 ymm2 {k7} {z}, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0xd3,0x7b] - vgetmantpbf16 ymm2 {k7} {z}, ymm3, 123 + vgetmantbf16 ymm2 {k7} {z}, ymm3, 123 -// CHECK: vgetmantpbf16 xmm2, xmm3, 123 +// CHECK: vgetmantbf16 xmm2, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0xd3,0x7b] - vgetmantpbf16 xmm2, xmm3, 123 + vgetmantbf16 xmm2, xmm3, 123 -// CHECK: vgetmantpbf16 xmm2 {k7}, xmm3, 123 +// CHECK: vgetmantbf16 xmm2 {k7}, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0xd3,0x7b] - vgetmantpbf16 xmm2 {k7}, xmm3, 123 + vgetmantbf16 xmm2 {k7}, xmm3, 123 -// CHECK: vgetmantpbf16 xmm2 {k7} {z}, xmm3, 123 +// CHECK: vgetmantbf16 xmm2 {k7} {z}, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0xd3,0x7b] - vgetmantpbf16 xmm2 {k7} {z}, xmm3, 123 + vgetmantbf16 xmm2 {k7} {z}, xmm3, 123 -// CHECK: vgetmantpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vgetmantbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 + vgetmantbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vgetmantpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vgetmantbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 + vgetmantbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vgetmantpbf16 xmm2, word ptr [eax]{1to8}, 123 +// CHECK: vgetmantbf16 xmm2, word ptr [eax]{1to8}, 123 // CHECK: encoding: 
[0x62,0xf3,0x7f,0x18,0x26,0x10,0x7b] - vgetmantpbf16 xmm2, word ptr [eax]{1to8}, 123 + vgetmantbf16 xmm2, word ptr [eax]{1to8}, 123 -// CHECK: vgetmantpbf16 xmm2, xmmword ptr [2*ebp - 512], 123 +// CHECK: vgetmantbf16 xmm2, xmmword ptr [2*ebp - 512], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x26,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vgetmantpbf16 xmm2, xmmword ptr [2*ebp - 512], 123 + vgetmantbf16 xmm2, xmmword ptr [2*ebp - 512], 123 -// CHECK: vgetmantpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 +// CHECK: vgetmantbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x26,0x51,0x7f,0x7b] - vgetmantpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 + vgetmantbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 -// CHECK: vgetmantpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 +// CHECK: vgetmantbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x26,0x52,0x80,0x7b] - vgetmantpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 + vgetmantbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 -// CHECK: vgetmantpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vgetmantbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 + vgetmantbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vgetmantpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 +// CHECK: vgetmantbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 + vgetmantbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 -// CHECK: vgetmantpbf16 ymm2, word ptr [eax]{1to16}, 123 +// CHECK: vgetmantbf16 ymm2, word ptr [eax]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x26,0x10,0x7b] - vgetmantpbf16 ymm2, 
word ptr [eax]{1to16}, 123 + vgetmantbf16 ymm2, word ptr [eax]{1to16}, 123 -// CHECK: vgetmantpbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 +// CHECK: vgetmantbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x26,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vgetmantpbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 + vgetmantbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 -// CHECK: vgetmantpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 +// CHECK: vgetmantbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x26,0x51,0x7f,0x7b] - vgetmantpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 + vgetmantbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 -// CHECK: vgetmantpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 +// CHECK: vgetmantbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x26,0x52,0x80,0x7b] - vgetmantpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 + vgetmantbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 -// CHECK: vgetmantpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vgetmantbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 + vgetmantbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vgetmantpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vgetmantbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 + vgetmantbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vgetmantpbf16 zmm2, word ptr [eax]{1to32}, 123 +// CHECK: vgetmantbf16 zmm2, word ptr [eax]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x26,0x10,0x7b] - vgetmantpbf16 zmm2, word ptr [eax]{1to32}, 123 + vgetmantbf16 zmm2, 
word ptr [eax]{1to32}, 123 -// CHECK: vgetmantpbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 +// CHECK: vgetmantbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x26,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vgetmantpbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 + vgetmantbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 -// CHECK: vgetmantpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 +// CHECK: vgetmantbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x26,0x51,0x7f,0x7b] - vgetmantpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 + vgetmantbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 -// CHECK: vgetmantpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 +// CHECK: vgetmantbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x26,0x52,0x80,0x7b] - vgetmantpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 + vgetmantbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 -// CHECK: vmaxpbf16 ymm2, ymm3, ymm4 +// CHECK: vmaxbf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0xd4] - vmaxpbf16 ymm2, ymm3, ymm4 + vmaxbf16 ymm2, ymm3, ymm4 -// CHECK: vmaxpbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vmaxbf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0xd4] - vmaxpbf16 ymm2 {k7}, ymm3, ymm4 + vmaxbf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vmaxbf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0xd4] - vmaxpbf16 ymm2 {k7} {z}, ymm3, ymm4 + vmaxbf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vmaxpbf16 zmm2, zmm3, zmm4 +// CHECK: vmaxbf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0xd4] - vmaxpbf16 zmm2, zmm3, zmm4 + vmaxbf16 zmm2, zmm3, zmm4 -// CHECK: vmaxpbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vmaxbf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0xd4] - vmaxpbf16 zmm2 {k7}, zmm3, zmm4 + vmaxbf16 zmm2 {k7}, zmm3, zmm4 -// 
CHECK: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vmaxbf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0xd4] - vmaxpbf16 zmm2 {k7} {z}, zmm3, zmm4 + vmaxbf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vmaxpbf16 xmm2, xmm3, xmm4 +// CHECK: vmaxbf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0xd4] - vmaxpbf16 xmm2, xmm3, xmm4 + vmaxbf16 xmm2, xmm3, xmm4 -// CHECK: vmaxpbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vmaxbf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0xd4] - vmaxpbf16 xmm2 {k7}, xmm3, xmm4 + vmaxbf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vmaxbf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0xd4] - vmaxpbf16 xmm2 {k7} {z}, xmm3, xmm4 + vmaxbf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vmaxpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vmaxbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10] - vmaxpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vmaxbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vmaxpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vmaxbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00] - vmaxpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vmaxbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vmaxpbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vmaxbf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5f,0x10] - vmaxpbf16 zmm2, zmm3, word ptr [eax]{1to32} + vmaxbf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vmaxpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vmaxbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5f,0x14,0x6d,0x00,0xf8,0xff,0xff] - vmaxpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 
2048] + vmaxbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vmaxpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vmaxbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5f,0x51,0x7f] - vmaxpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vmaxbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vmaxpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vmaxbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5f,0x52,0x80] - vmaxpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vmaxbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vmaxpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vmaxbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10] - vmaxpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vmaxbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vmaxpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vmaxbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00] - vmaxpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vmaxbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vmaxpbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vmaxbf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5f,0x10] - vmaxpbf16 ymm2, ymm3, word ptr [eax]{1to16} + vmaxbf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vmaxpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vmaxbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5f,0x14,0x6d,0x00,0xfc,0xff,0xff] - vmaxpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vmaxbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vmaxpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vmaxbf16 ymm2 
{k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5f,0x51,0x7f] - vmaxpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vmaxbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vmaxpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vmaxbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5f,0x52,0x80] - vmaxpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vmaxbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vmaxpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vmaxbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10] - vmaxpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vmaxbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vmaxpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vmaxbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00] - vmaxpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vmaxbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vmaxpbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vmaxbf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5f,0x10] - vmaxpbf16 xmm2, xmm3, word ptr [eax]{1to8} + vmaxbf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vmaxpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vmaxbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5f,0x14,0x6d,0x00,0xfe,0xff,0xff] - vmaxpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vmaxbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vmaxpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vmaxbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5f,0x51,0x7f] - vmaxpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + 
vmaxbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vmaxpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vmaxbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5f,0x52,0x80] - vmaxpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vmaxbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vminpbf16 ymm2, ymm3, ymm4 +// CHECK: vminbf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0xd4] - vminpbf16 ymm2, ymm3, ymm4 + vminbf16 ymm2, ymm3, ymm4 -// CHECK: vminpbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vminbf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0xd4] - vminpbf16 ymm2 {k7}, ymm3, ymm4 + vminbf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vminpbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vminbf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0xd4] - vminpbf16 ymm2 {k7} {z}, ymm3, ymm4 + vminbf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vminpbf16 zmm2, zmm3, zmm4 +// CHECK: vminbf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0xd4] - vminpbf16 zmm2, zmm3, zmm4 + vminbf16 zmm2, zmm3, zmm4 -// CHECK: vminpbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vminbf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0xd4] - vminpbf16 zmm2 {k7}, zmm3, zmm4 + vminbf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vminpbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vminbf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0xd4] - vminpbf16 zmm2 {k7} {z}, zmm3, zmm4 + vminbf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vminpbf16 xmm2, xmm3, xmm4 +// CHECK: vminbf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0xd4] - vminpbf16 xmm2, xmm3, xmm4 + vminbf16 xmm2, xmm3, xmm4 -// CHECK: vminpbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vminbf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0xd4] - vminpbf16 xmm2 {k7}, xmm3, xmm4 + vminbf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vminpbf16 xmm2 
{k7} {z}, xmm3, xmm4 +// CHECK: vminbf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0xd4] - vminpbf16 xmm2 {k7} {z}, xmm3, xmm4 + vminbf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vminpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vminbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10] - vminpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vminbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vminpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vminbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00] - vminpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vminbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vminpbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vminbf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5d,0x10] - vminpbf16 zmm2, zmm3, word ptr [eax]{1to32} + vminbf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vminpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vminbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5d,0x14,0x6d,0x00,0xf8,0xff,0xff] - vminpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vminbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vminpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vminbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5d,0x51,0x7f] - vminpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vminbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vminpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vminbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5d,0x52,0x80] - vminpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vminbf16 zmm2 
{k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vminpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vminbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10] - vminpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vminbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vminpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vminbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00] - vminpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vminbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vminpbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vminbf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x5d,0x10] - vminpbf16 ymm2, ymm3, word ptr [eax]{1to16} + vminbf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vminpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vminbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5d,0x14,0x6d,0x00,0xfc,0xff,0xff] - vminpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vminbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vminpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vminbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5d,0x51,0x7f] - vminpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vminbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vminpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vminbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5d,0x52,0x80] - vminpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vminbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vminpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vminbf16 xmm2, xmm3, 
xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10] - vminpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vminbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vminpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vminbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00] - vminpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vminbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vminpbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vminbf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5d,0x10] - vminpbf16 xmm2, xmm3, word ptr [eax]{1to8} + vminbf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vminpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vminbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5d,0x14,0x6d,0x00,0xfe,0xff,0xff] - vminpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vminbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vminpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vminbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5d,0x51,0x7f] - vminpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vminbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vminpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vminbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5d,0x52,0x80] - vminpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vminbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vmulnepbf16 ymm2, ymm3, ymm4 +// CHECK: vmulbf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0xd4] - vmulnepbf16 ymm2, ymm3, ymm4 + vmulbf16 ymm2, ymm3, ymm4 -// CHECK: vmulnepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vmulbf16 ymm2 {k7}, 
ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x59,0xd4] - vmulnepbf16 ymm2 {k7}, ymm3, ymm4 + vmulbf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vmulbf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0xd4] - vmulnepbf16 ymm2 {k7} {z}, ymm3, ymm4 + vmulbf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vmulnepbf16 zmm2, zmm3, zmm4 +// CHECK: vmulbf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0xd4] - vmulnepbf16 zmm2, zmm3, zmm4 + vmulbf16 zmm2, zmm3, zmm4 -// CHECK: vmulnepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vmulbf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0xd4] - vmulnepbf16 zmm2 {k7}, zmm3, zmm4 + vmulbf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vmulbf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0xd4] - vmulnepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vmulbf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vmulnepbf16 xmm2, xmm3, xmm4 +// CHECK: vmulbf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0xd4] - vmulnepbf16 xmm2, xmm3, xmm4 + vmulbf16 xmm2, xmm3, xmm4 -// CHECK: vmulnepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vmulbf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0xd4] - vmulnepbf16 xmm2 {k7}, xmm3, xmm4 + vmulbf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vmulbf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0xd4] - vmulnepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vmulbf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vmulnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vmulbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x94,0xf4,0x00,0x00,0x00,0x10] - vmulnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vmulbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vmulnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 
4*eax + 291] +// CHECK: vmulbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x59,0x94,0x87,0x23,0x01,0x00,0x00] - vmulnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vmulbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vmulnepbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vmulbf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x59,0x10] - vmulnepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vmulbf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vmulnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vmulbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x59,0x14,0x6d,0x00,0xf8,0xff,0xff] - vmulnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vmulbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vmulnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vmulbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x59,0x51,0x7f] - vmulnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vmulbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vmulnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vmulbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x59,0x52,0x80] - vmulnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vmulbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vmulnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vmulbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x94,0xf4,0x00,0x00,0x00,0x10] - vmulnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vmulbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vmulnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vmulbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: 
[0x62,0xf5,0x65,0x2f,0x59,0x94,0x87,0x23,0x01,0x00,0x00] - vmulnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vmulbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vmulnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vmulbf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0x38,0x59,0x10] - vmulnepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vmulbf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vmulnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vmulbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x59,0x14,0x6d,0x00,0xfc,0xff,0xff] - vmulnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vmulbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vmulnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vmulbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x59,0x51,0x7f] - vmulnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vmulbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vmulnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vmulbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x59,0x52,0x80] - vmulnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vmulbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vmulnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vmulbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x94,0xf4,0x00,0x00,0x00,0x10] - vmulnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vmulbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vmulnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vmulbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x59,0x94,0x87,0x23,0x01,0x00,0x00] - vmulnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + 
vmulbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vmulnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vmulbf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x59,0x10] - vmulnepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vmulbf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vmulnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vmulbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x59,0x14,0x6d,0x00,0xfe,0xff,0xff] - vmulnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vmulbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vmulnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vmulbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x59,0x51,0x7f] - vmulnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vmulbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vmulnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vmulbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x59,0x52,0x80] - vmulnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vmulbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vrcppbf16 xmm2, xmm3 +// CHECK: vrcpbf16 xmm2, xmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0xd3] - vrcppbf16 xmm2, xmm3 + vrcpbf16 xmm2, xmm3 -// CHECK: vrcppbf16 xmm2 {k7}, xmm3 +// CHECK: vrcpbf16 xmm2 {k7}, xmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0xd3] - vrcppbf16 xmm2 {k7}, xmm3 + vrcpbf16 xmm2 {k7}, xmm3 -// CHECK: vrcppbf16 xmm2 {k7} {z}, xmm3 +// CHECK: vrcpbf16 xmm2 {k7} {z}, xmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4c,0xd3] - vrcppbf16 xmm2 {k7} {z}, xmm3 + vrcpbf16 xmm2 {k7} {z}, xmm3 -// CHECK: vrcppbf16 zmm2, zmm3 +// CHECK: vrcpbf16 zmm2, zmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0xd3] - vrcppbf16 zmm2, zmm3 + vrcpbf16 zmm2, zmm3 -// CHECK: vrcppbf16 zmm2 {k7}, zmm3 +// CHECK: vrcpbf16 zmm2 {k7}, 
zmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0xd3] - vrcppbf16 zmm2 {k7}, zmm3 + vrcpbf16 zmm2 {k7}, zmm3 -// CHECK: vrcppbf16 zmm2 {k7} {z}, zmm3 +// CHECK: vrcpbf16 zmm2 {k7} {z}, zmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0xd3] - vrcppbf16 zmm2 {k7} {z}, zmm3 + vrcpbf16 zmm2 {k7} {z}, zmm3 -// CHECK: vrcppbf16 ymm2, ymm3 +// CHECK: vrcpbf16 ymm2, ymm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0xd3] - vrcppbf16 ymm2, ymm3 + vrcpbf16 ymm2, ymm3 -// CHECK: vrcppbf16 ymm2 {k7}, ymm3 +// CHECK: vrcpbf16 ymm2 {k7}, ymm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0xd3] - vrcppbf16 ymm2 {k7}, ymm3 + vrcpbf16 ymm2 {k7}, ymm3 -// CHECK: vrcppbf16 ymm2 {k7} {z}, ymm3 +// CHECK: vrcpbf16 ymm2 {k7} {z}, ymm3 // CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0xd3] - vrcppbf16 ymm2 {k7} {z}, ymm3 + vrcpbf16 ymm2 {k7} {z}, ymm3 -// CHECK: vrcppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vrcpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10] - vrcppbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] + vrcpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vrcppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +// CHECK: vrcpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00] - vrcppbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] + vrcpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] -// CHECK: vrcppbf16 xmm2, word ptr [eax]{1to8} +// CHECK: vrcpbf16 xmm2, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4c,0x10] - vrcppbf16 xmm2, word ptr [eax]{1to8} + vrcpbf16 xmm2, word ptr [eax]{1to8} -// CHECK: vrcppbf16 xmm2, xmmword ptr [2*ebp - 512] +// CHECK: vrcpbf16 xmm2, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vrcppbf16 xmm2, xmmword ptr [2*ebp - 512] + vrcpbf16 xmm2, xmmword ptr [2*ebp - 512] -// CHECK: vrcppbf16 xmm2 {k7} 
{z}, xmmword ptr [ecx + 2032] +// CHECK: vrcpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4c,0x51,0x7f] - vrcppbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] + vrcpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] -// CHECK: vrcppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +// CHECK: vrcpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4c,0x52,0x80] - vrcppbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} + vrcpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} -// CHECK: vrcppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vrcpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10] - vrcppbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] + vrcpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vrcppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] +// CHECK: vrcpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00] - vrcppbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] + vrcpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] -// CHECK: vrcppbf16 ymm2, word ptr [eax]{1to16} +// CHECK: vrcpbf16 ymm2, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4c,0x10] - vrcppbf16 ymm2, word ptr [eax]{1to16} + vrcpbf16 ymm2, word ptr [eax]{1to16} -// CHECK: vrcppbf16 ymm2, ymmword ptr [2*ebp - 1024] +// CHECK: vrcpbf16 ymm2, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vrcppbf16 ymm2, ymmword ptr [2*ebp - 1024] + vrcpbf16 ymm2, ymmword ptr [2*ebp - 1024] -// CHECK: vrcppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +// CHECK: vrcpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4c,0x51,0x7f] - vrcppbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] + vrcpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] -// CHECK: vrcppbf16 ymm2 {k7} {z}, word ptr 
[edx - 256]{1to16} +// CHECK: vrcpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x7c,0xbf,0x4c,0x52,0x80] - vrcppbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} + vrcpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} -// CHECK: vrcppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vrcpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10] - vrcppbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] + vrcpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vrcppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +// CHECK: vrcpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00] - vrcppbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] + vrcpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] -// CHECK: vrcppbf16 zmm2, word ptr [eax]{1to32} +// CHECK: vrcpbf16 zmm2, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4c,0x10] - vrcppbf16 zmm2, word ptr [eax]{1to32} + vrcpbf16 zmm2, word ptr [eax]{1to32} -// CHECK: vrcppbf16 zmm2, zmmword ptr [2*ebp - 2048] +// CHECK: vrcpbf16 zmm2, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vrcppbf16 zmm2, zmmword ptr [2*ebp - 2048] + vrcpbf16 zmm2, zmmword ptr [2*ebp - 2048] -// CHECK: vrcppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +// CHECK: vrcpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4c,0x51,0x7f] - vrcppbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] + vrcpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] -// CHECK: vrcppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +// CHECK: vrcpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4c,0x52,0x80] - vrcppbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} + vrcpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} -// CHECK: vreducenepbf16 zmm2, zmm3, 123 +// 
CHECK: vreducebf16 zmm2, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0xd3,0x7b] - vreducenepbf16 zmm2, zmm3, 123 + vreducebf16 zmm2, zmm3, 123 -// CHECK: vreducenepbf16 zmm2 {k7}, zmm3, 123 +// CHECK: vreducebf16 zmm2 {k7}, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0xd3,0x7b] - vreducenepbf16 zmm2 {k7}, zmm3, 123 + vreducebf16 zmm2 {k7}, zmm3, 123 -// CHECK: vreducenepbf16 zmm2 {k7} {z}, zmm3, 123 +// CHECK: vreducebf16 zmm2 {k7} {z}, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0xd3,0x7b] - vreducenepbf16 zmm2 {k7} {z}, zmm3, 123 + vreducebf16 zmm2 {k7} {z}, zmm3, 123 -// CHECK: vreducenepbf16 ymm2, ymm3, 123 +// CHECK: vreducebf16 ymm2, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0xd3,0x7b] - vreducenepbf16 ymm2, ymm3, 123 + vreducebf16 ymm2, ymm3, 123 -// CHECK: vreducenepbf16 ymm2 {k7}, ymm3, 123 +// CHECK: vreducebf16 ymm2 {k7}, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0xd3,0x7b] - vreducenepbf16 ymm2 {k7}, ymm3, 123 + vreducebf16 ymm2 {k7}, ymm3, 123 -// CHECK: vreducenepbf16 ymm2 {k7} {z}, ymm3, 123 +// CHECK: vreducebf16 ymm2 {k7} {z}, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0xd3,0x7b] - vreducenepbf16 ymm2 {k7} {z}, ymm3, 123 + vreducebf16 ymm2 {k7} {z}, ymm3, 123 -// CHECK: vreducenepbf16 xmm2, xmm3, 123 +// CHECK: vreducebf16 xmm2, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0xd3,0x7b] - vreducenepbf16 xmm2, xmm3, 123 + vreducebf16 xmm2, xmm3, 123 -// CHECK: vreducenepbf16 xmm2 {k7}, xmm3, 123 +// CHECK: vreducebf16 xmm2 {k7}, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0xd3,0x7b] - vreducenepbf16 xmm2 {k7}, xmm3, 123 + vreducebf16 xmm2 {k7}, xmm3, 123 -// CHECK: vreducenepbf16 xmm2 {k7} {z}, xmm3, 123 +// CHECK: vreducebf16 xmm2 {k7} {z}, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0xd3,0x7b] - vreducenepbf16 xmm2 {k7} {z}, xmm3, 123 + vreducebf16 xmm2 {k7} {z}, xmm3, 123 -// CHECK: vreducenepbf16 xmm2, xmmword ptr [esp + 8*esi + 
268435456], 123 +// CHECK: vreducebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 + vreducebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vreducenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vreducebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 + vreducebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vreducenepbf16 xmm2, word ptr [eax]{1to8}, 123 +// CHECK: vreducebf16 xmm2, word ptr [eax]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x56,0x10,0x7b] - vreducenepbf16 xmm2, word ptr [eax]{1to8}, 123 + vreducebf16 xmm2, word ptr [eax]{1to8}, 123 -// CHECK: vreducenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123 +// CHECK: vreducebf16 xmm2, xmmword ptr [2*ebp - 512], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x56,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vreducenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123 + vreducebf16 xmm2, xmmword ptr [2*ebp - 512], 123 -// CHECK: vreducenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 +// CHECK: vreducebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x56,0x51,0x7f,0x7b] - vreducenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 + vreducebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 -// CHECK: vreducenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 +// CHECK: vreducebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x56,0x52,0x80,0x7b] - vreducenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 + vreducebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 -// CHECK: vreducenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vreducebf16 ymm2, ymmword ptr 
[esp + 8*esi + 268435456], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 + vreducebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vreducenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 +// CHECK: vreducebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 + vreducebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 -// CHECK: vreducenepbf16 ymm2, word ptr [eax]{1to16}, 123 +// CHECK: vreducebf16 ymm2, word ptr [eax]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x56,0x10,0x7b] - vreducenepbf16 ymm2, word ptr [eax]{1to16}, 123 + vreducebf16 ymm2, word ptr [eax]{1to16}, 123 -// CHECK: vreducenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 +// CHECK: vreducebf16 ymm2, ymmword ptr [2*ebp - 1024], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x56,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vreducenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 + vreducebf16 ymm2, ymmword ptr [2*ebp - 1024], 123 -// CHECK: vreducenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 +// CHECK: vreducebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x56,0x51,0x7f,0x7b] - vreducenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 + vreducebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 -// CHECK: vreducenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 +// CHECK: vreducebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x56,0x52,0x80,0x7b] - vreducenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 + vreducebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 -// CHECK: vreducenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vreducebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 // CHECK: 
encoding: [0x62,0xf3,0x7f,0x48,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 + vreducebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vreducenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vreducebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 + vreducebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vreducenepbf16 zmm2, word ptr [eax]{1to32}, 123 +// CHECK: vreducebf16 zmm2, word ptr [eax]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x56,0x10,0x7b] - vreducenepbf16 zmm2, word ptr [eax]{1to32}, 123 + vreducebf16 zmm2, word ptr [eax]{1to32}, 123 -// CHECK: vreducenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 +// CHECK: vreducebf16 zmm2, zmmword ptr [2*ebp - 2048], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x56,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vreducenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 + vreducebf16 zmm2, zmmword ptr [2*ebp - 2048], 123 -// CHECK: vreducenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 +// CHECK: vreducebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x56,0x51,0x7f,0x7b] - vreducenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 + vreducebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 -// CHECK: vreducenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 +// CHECK: vreducebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x56,0x52,0x80,0x7b] - vreducenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 + vreducebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 -// CHECK: vrndscalenepbf16 zmm2, zmm3, 123 +// CHECK: vrndscalebf16 zmm2, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0xd3,0x7b] - vrndscalenepbf16 zmm2, zmm3, 123 + vrndscalebf16 zmm2, zmm3, 
123 -// CHECK: vrndscalenepbf16 zmm2 {k7}, zmm3, 123 +// CHECK: vrndscalebf16 zmm2 {k7}, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0xd3,0x7b] - vrndscalenepbf16 zmm2 {k7}, zmm3, 123 + vrndscalebf16 zmm2 {k7}, zmm3, 123 -// CHECK: vrndscalenepbf16 zmm2 {k7} {z}, zmm3, 123 +// CHECK: vrndscalebf16 zmm2 {k7} {z}, zmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0xd3,0x7b] - vrndscalenepbf16 zmm2 {k7} {z}, zmm3, 123 + vrndscalebf16 zmm2 {k7} {z}, zmm3, 123 -// CHECK: vrndscalenepbf16 ymm2, ymm3, 123 +// CHECK: vrndscalebf16 ymm2, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0xd3,0x7b] - vrndscalenepbf16 ymm2, ymm3, 123 + vrndscalebf16 ymm2, ymm3, 123 -// CHECK: vrndscalenepbf16 ymm2 {k7}, ymm3, 123 +// CHECK: vrndscalebf16 ymm2 {k7}, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0xd3,0x7b] - vrndscalenepbf16 ymm2 {k7}, ymm3, 123 + vrndscalebf16 ymm2 {k7}, ymm3, 123 -// CHECK: vrndscalenepbf16 ymm2 {k7} {z}, ymm3, 123 +// CHECK: vrndscalebf16 ymm2 {k7} {z}, ymm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0xd3,0x7b] - vrndscalenepbf16 ymm2 {k7} {z}, ymm3, 123 + vrndscalebf16 ymm2 {k7} {z}, ymm3, 123 -// CHECK: vrndscalenepbf16 xmm2, xmm3, 123 +// CHECK: vrndscalebf16 xmm2, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0xd3,0x7b] - vrndscalenepbf16 xmm2, xmm3, 123 + vrndscalebf16 xmm2, xmm3, 123 -// CHECK: vrndscalenepbf16 xmm2 {k7}, xmm3, 123 +// CHECK: vrndscalebf16 xmm2 {k7}, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0xd3,0x7b] - vrndscalenepbf16 xmm2 {k7}, xmm3, 123 + vrndscalebf16 xmm2 {k7}, xmm3, 123 -// CHECK: vrndscalenepbf16 xmm2 {k7} {z}, xmm3, 123 +// CHECK: vrndscalebf16 xmm2 {k7} {z}, xmm3, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0xd3,0x7b] - vrndscalenepbf16 xmm2 {k7} {z}, xmm3, 123 + vrndscalebf16 xmm2 {k7} {z}, xmm3, 123 -// CHECK: vrndscalenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vrndscalebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 // 
CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 + vrndscalebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vrndscalenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vrndscalebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 + vrndscalebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vrndscalenepbf16 xmm2, word ptr [eax]{1to8}, 123 +// CHECK: vrndscalebf16 xmm2, word ptr [eax]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x08,0x10,0x7b] - vrndscalenepbf16 xmm2, word ptr [eax]{1to8}, 123 + vrndscalebf16 xmm2, word ptr [eax]{1to8}, 123 -// CHECK: vrndscalenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123 +// CHECK: vrndscalebf16 xmm2, xmmword ptr [2*ebp - 512], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x08,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vrndscalenepbf16 xmm2, xmmword ptr [2*ebp - 512], 123 + vrndscalebf16 xmm2, xmmword ptr [2*ebp - 512], 123 -// CHECK: vrndscalenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 +// CHECK: vrndscalebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x8f,0x08,0x51,0x7f,0x7b] - vrndscalenepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 + vrndscalebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123 -// CHECK: vrndscalenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 +// CHECK: vrndscalebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x9f,0x08,0x52,0x80,0x7b] - vrndscalenepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 + vrndscalebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123 -// CHECK: vrndscalenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vrndscalebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 // CHECK: 
encoding: [0x62,0xf3,0x7f,0x28,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 + vrndscalebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vrndscalenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 +// CHECK: vrndscalebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 + vrndscalebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123 -// CHECK: vrndscalenepbf16 ymm2, word ptr [eax]{1to16}, 123 +// CHECK: vrndscalebf16 ymm2, word ptr [eax]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x08,0x10,0x7b] - vrndscalenepbf16 ymm2, word ptr [eax]{1to16}, 123 + vrndscalebf16 ymm2, word ptr [eax]{1to16}, 123 -// CHECK: vrndscalenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 +// CHECK: vrndscalebf16 ymm2, ymmword ptr [2*ebp - 1024], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x08,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vrndscalenepbf16 ymm2, ymmword ptr [2*ebp - 1024], 123 + vrndscalebf16 ymm2, ymmword ptr [2*ebp - 1024], 123 -// CHECK: vrndscalenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 +// CHECK: vrndscalebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xaf,0x08,0x51,0x7f,0x7b] - vrndscalenepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 + vrndscalebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123 -// CHECK: vrndscalenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 +// CHECK: vrndscalebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xbf,0x08,0x52,0x80,0x7b] - vrndscalenepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 + vrndscalebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123 -// CHECK: vrndscalenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 +// CHECK: vrndscalebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 // CHECK: 
encoding: [0x62,0xf3,0x7f,0x48,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 + vrndscalebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123 -// CHECK: vrndscalenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 +// CHECK: vrndscalebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 + vrndscalebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123 -// CHECK: vrndscalenepbf16 zmm2, word ptr [eax]{1to32}, 123 +// CHECK: vrndscalebf16 zmm2, word ptr [eax]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x08,0x10,0x7b] - vrndscalenepbf16 zmm2, word ptr [eax]{1to32}, 123 + vrndscalebf16 zmm2, word ptr [eax]{1to32}, 123 -// CHECK: vrndscalenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 +// CHECK: vrndscalebf16 zmm2, zmmword ptr [2*ebp - 2048], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x08,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vrndscalenepbf16 zmm2, zmmword ptr [2*ebp - 2048], 123 + vrndscalebf16 zmm2, zmmword ptr [2*ebp - 2048], 123 -// CHECK: vrndscalenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 +// CHECK: vrndscalebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xcf,0x08,0x51,0x7f,0x7b] - vrndscalenepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 + vrndscalebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123 -// CHECK: vrndscalenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 +// CHECK: vrndscalebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0xdf,0x08,0x52,0x80,0x7b] - vrndscalenepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 + vrndscalebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123 -// CHECK: vrsqrtpbf16 xmm2, xmm3 +// CHECK: vrsqrtbf16 xmm2, xmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0xd3] - vrsqrtpbf16 xmm2, xmm3 + vrsqrtbf16 
xmm2, xmm3 -// CHECK: vrsqrtpbf16 xmm2 {k7}, xmm3 +// CHECK: vrsqrtbf16 xmm2 {k7}, xmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x0f,0x4e,0xd3] - vrsqrtpbf16 xmm2 {k7}, xmm3 + vrsqrtbf16 xmm2 {k7}, xmm3 -// CHECK: vrsqrtpbf16 xmm2 {k7} {z}, xmm3 +// CHECK: vrsqrtbf16 xmm2 {k7} {z}, xmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0xd3] - vrsqrtpbf16 xmm2 {k7} {z}, xmm3 + vrsqrtbf16 xmm2 {k7} {z}, xmm3 -// CHECK: vrsqrtpbf16 zmm2, zmm3 +// CHECK: vrsqrtbf16 zmm2, zmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0xd3] - vrsqrtpbf16 zmm2, zmm3 + vrsqrtbf16 zmm2, zmm3 -// CHECK: vrsqrtpbf16 zmm2 {k7}, zmm3 +// CHECK: vrsqrtbf16 zmm2 {k7}, zmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0xd3] - vrsqrtpbf16 zmm2 {k7}, zmm3 + vrsqrtbf16 zmm2 {k7}, zmm3 -// CHECK: vrsqrtpbf16 zmm2 {k7} {z}, zmm3 +// CHECK: vrsqrtbf16 zmm2 {k7} {z}, zmm3 // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0xd3] - vrsqrtpbf16 zmm2 {k7} {z}, zmm3 + vrsqrtbf16 zmm2 {k7} {z}, zmm3 -// CHECK: vrsqrtpbf16 ymm2, ymm3 +// CHECK: vrsqrtbf16 ymm2, ymm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0xd3] - vrsqrtpbf16 ymm2, ymm3 + vrsqrtbf16 ymm2, ymm3 -// CHECK: vrsqrtpbf16 ymm2 {k7}, ymm3 +// CHECK: vrsqrtbf16 ymm2 {k7}, ymm3 // CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4e,0xd3] - vrsqrtpbf16 ymm2 {k7}, ymm3 + vrsqrtbf16 ymm2 {k7}, ymm3 -// CHECK: vrsqrtpbf16 ymm2 {k7} {z}, ymm3 +// CHECK: vrsqrtbf16 ymm2 {k7} {z}, ymm3 // CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4e,0xd3] - vrsqrtpbf16 ymm2 {k7} {z}, ymm3 + vrsqrtbf16 ymm2 {k7} {z}, ymm3 -// CHECK: vrsqrtpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vrsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10] - vrsqrtpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] + vrsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vrsqrtpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +// CHECK: vrsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: 
[0x62,0xf6,0x7c,0x0f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00] - vrsqrtpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] + vrsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] -// CHECK: vrsqrtpbf16 xmm2, word ptr [eax]{1to8} +// CHECK: vrsqrtbf16 xmm2, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x7c,0x18,0x4e,0x10] - vrsqrtpbf16 xmm2, word ptr [eax]{1to8} + vrsqrtbf16 xmm2, word ptr [eax]{1to8} -// CHECK: vrsqrtpbf16 xmm2, xmmword ptr [2*ebp - 512] +// CHECK: vrsqrtbf16 xmm2, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x7c,0x08,0x4e,0x14,0x6d,0x00,0xfe,0xff,0xff] - vrsqrtpbf16 xmm2, xmmword ptr [2*ebp - 512] + vrsqrtbf16 xmm2, xmmword ptr [2*ebp - 512] -// CHECK: vrsqrtpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] +// CHECK: vrsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf6,0x7c,0x8f,0x4e,0x51,0x7f] - vrsqrtpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] + vrsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] -// CHECK: vrsqrtpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +// CHECK: vrsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x7c,0x9f,0x4e,0x52,0x80] - vrsqrtpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} + vrsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} -// CHECK: vrsqrtpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vrsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10] - vrsqrtpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] + vrsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vrsqrtpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] +// CHECK: vrsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x7c,0x2f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00] - vrsqrtpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] + vrsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] -// CHECK: vrsqrtpbf16 ymm2, word ptr [eax]{1to16} +// CHECK: vrsqrtbf16 ymm2, word ptr 
[eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x7c,0x38,0x4e,0x10] - vrsqrtpbf16 ymm2, word ptr [eax]{1to16} + vrsqrtbf16 ymm2, word ptr [eax]{1to16} -// CHECK: vrsqrtpbf16 ymm2, ymmword ptr [2*ebp - 1024] +// CHECK: vrsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x7c,0x28,0x4e,0x14,0x6d,0x00,0xfc,0xff,0xff] - vrsqrtpbf16 ymm2, ymmword ptr [2*ebp - 1024] + vrsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024] -// CHECK: vrsqrtpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +// CHECK: vrsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x7c,0xaf,0x4e,0x51,0x7f] - vrsqrtpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] + vrsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] -// CHECK: vrsqrtpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} +// CHECK: vrsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x7c,0xbf,0x4e,0x52,0x80] - vrsqrtpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} + vrsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} -// CHECK: vrsqrtpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vrsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10] - vrsqrtpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] + vrsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vrsqrtpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +// CHECK: vrsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x7c,0x4f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00] - vrsqrtpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] + vrsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] -// CHECK: vrsqrtpbf16 zmm2, word ptr [eax]{1to32} +// CHECK: vrsqrtbf16 zmm2, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x7c,0x58,0x4e,0x10] - vrsqrtpbf16 zmm2, word ptr [eax]{1to32} + vrsqrtbf16 zmm2, word ptr [eax]{1to32} -// CHECK: vrsqrtpbf16 zmm2, zmmword ptr [2*ebp - 2048] +// CHECK: vrsqrtbf16 zmm2, zmmword ptr 
[2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x7c,0x48,0x4e,0x14,0x6d,0x00,0xf8,0xff,0xff] - vrsqrtpbf16 zmm2, zmmword ptr [2*ebp - 2048] + vrsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048] -// CHECK: vrsqrtpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +// CHECK: vrsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x7c,0xcf,0x4e,0x51,0x7f] - vrsqrtpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] + vrsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] -// CHECK: vrsqrtpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +// CHECK: vrsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x7c,0xdf,0x4e,0x52,0x80] - vrsqrtpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} + vrsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} -// CHECK: vscalefpbf16 ymm2, ymm3, ymm4 +// CHECK: vscalefbf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0xd4] - vscalefpbf16 ymm2, ymm3, ymm4 + vscalefbf16 ymm2, ymm3, ymm4 -// CHECK: vscalefpbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vscalefbf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0xd4] - vscalefpbf16 ymm2 {k7}, ymm3, ymm4 + vscalefbf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vscalefbf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0xd4] - vscalefpbf16 ymm2 {k7} {z}, ymm3, ymm4 + vscalefbf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vscalefpbf16 zmm2, zmm3, zmm4 +// CHECK: vscalefbf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0xd4] - vscalefpbf16 zmm2, zmm3, zmm4 + vscalefbf16 zmm2, zmm3, zmm4 -// CHECK: vscalefpbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vscalefbf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0xd4] - vscalefpbf16 zmm2 {k7}, zmm3, zmm4 + vscalefbf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vscalefpbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vscalefbf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0xd4] - vscalefpbf16 
zmm2 {k7} {z}, zmm3, zmm4 + vscalefbf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vscalefpbf16 xmm2, xmm3, xmm4 +// CHECK: vscalefbf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0xd4] - vscalefpbf16 xmm2, xmm3, xmm4 + vscalefbf16 xmm2, xmm3, xmm4 -// CHECK: vscalefpbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vscalefbf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0xd4] - vscalefpbf16 xmm2 {k7}, xmm3, xmm4 + vscalefbf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vscalefbf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf6,0x64,0x8f,0x2c,0xd4] - vscalefpbf16 xmm2 {k7} {z}, xmm3, xmm4 + vscalefbf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vscalefpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vscalefbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10] - vscalefpbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vscalefbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vscalefpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vscalefbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x4f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00] - vscalefpbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vscalefbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vscalefpbf16 zmm2, zmm3, word ptr [eax]{1to32} +// CHECK: vscalefbf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0x58,0x2c,0x10] - vscalefpbf16 zmm2, zmm3, word ptr [eax]{1to32} + vscalefbf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vscalefpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vscalefbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf6,0x64,0x48,0x2c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vscalefpbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vscalefbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: 
vscalefpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vscalefbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf6,0x64,0xcf,0x2c,0x51,0x7f] - vscalefpbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vscalefbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vscalefpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vscalefbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf6,0x64,0xdf,0x2c,0x52,0x80] - vscalefpbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vscalefbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vscalefpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vscalefbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10] - vscalefpbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vscalefbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vscalefpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vscalefbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x2f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00] - vscalefpbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vscalefbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vscalefpbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vscalefbf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0x38,0x2c,0x10] - vscalefpbf16 ymm2, ymm3, word ptr [eax]{1to16} + vscalefbf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vscalefpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vscalefbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf6,0x64,0x28,0x2c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vscalefpbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vscalefbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vscalefpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: 
vscalefbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf6,0x64,0xaf,0x2c,0x51,0x7f] - vscalefpbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vscalefbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vscalefpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vscalefbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf6,0x64,0xbf,0x2c,0x52,0x80] - vscalefpbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vscalefbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vscalefpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vscalefbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10] - vscalefpbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vscalefbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vscalefpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vscalefbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf6,0x64,0x0f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00] - vscalefpbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vscalefbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vscalefpbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vscalefbf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x18,0x2c,0x10] - vscalefpbf16 xmm2, xmm3, word ptr [eax]{1to8} + vscalefbf16 xmm2, xmm3, word ptr [eax]{1to8} -// CHECK: vscalefpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vscalefbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf6,0x64,0x08,0x2c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vscalefpbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vscalefbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vscalefpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vscalefbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: 
[0x62,0xf6,0x64,0x8f,0x2c,0x51,0x7f] - vscalefpbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vscalefbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vscalefpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vscalefbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf6,0x64,0x9f,0x2c,0x52,0x80] - vscalefpbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vscalefbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} -// CHECK: vsqrtnepbf16 xmm2, xmm3 +// CHECK: vsqrtbf16 xmm2, xmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0xd3] - vsqrtnepbf16 xmm2, xmm3 + vsqrtbf16 xmm2, xmm3 -// CHECK: vsqrtnepbf16 xmm2 {k7}, xmm3 +// CHECK: vsqrtbf16 xmm2 {k7}, xmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x51,0xd3] - vsqrtnepbf16 xmm2 {k7}, xmm3 + vsqrtbf16 xmm2 {k7}, xmm3 -// CHECK: vsqrtnepbf16 xmm2 {k7} {z}, xmm3 +// CHECK: vsqrtbf16 xmm2 {k7} {z}, xmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0xd3] - vsqrtnepbf16 xmm2 {k7} {z}, xmm3 + vsqrtbf16 xmm2 {k7} {z}, xmm3 -// CHECK: vsqrtnepbf16 zmm2, zmm3 +// CHECK: vsqrtbf16 zmm2, zmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0xd3] - vsqrtnepbf16 zmm2, zmm3 + vsqrtbf16 zmm2, zmm3 -// CHECK: vsqrtnepbf16 zmm2 {k7}, zmm3 +// CHECK: vsqrtbf16 zmm2 {k7}, zmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0xd3] - vsqrtnepbf16 zmm2 {k7}, zmm3 + vsqrtbf16 zmm2 {k7}, zmm3 -// CHECK: vsqrtnepbf16 zmm2 {k7} {z}, zmm3 +// CHECK: vsqrtbf16 zmm2 {k7} {z}, zmm3 // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0xd3] - vsqrtnepbf16 zmm2 {k7} {z}, zmm3 + vsqrtbf16 zmm2 {k7} {z}, zmm3 -// CHECK: vsqrtnepbf16 ymm2, ymm3 +// CHECK: vsqrtbf16 ymm2, ymm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0xd3] - vsqrtnepbf16 ymm2, ymm3 + vsqrtbf16 ymm2, ymm3 -// CHECK: vsqrtnepbf16 ymm2 {k7}, ymm3 +// CHECK: vsqrtbf16 ymm2 {k7}, ymm3 // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0xd3] - vsqrtnepbf16 ymm2 {k7}, ymm3 + vsqrtbf16 ymm2 {k7}, ymm3 -// CHECK: vsqrtnepbf16 ymm2 {k7} {z}, 
ymm3 +// CHECK: vsqrtbf16 ymm2 {k7} {z}, ymm3 // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0xd3] - vsqrtnepbf16 ymm2 {k7} {z}, ymm3 + vsqrtbf16 ymm2 {k7} {z}, ymm3 -// CHECK: vsqrtnepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x94,0xf4,0x00,0x00,0x00,0x10] - vsqrtnepbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] + vsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vsqrtnepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] +// CHECK: vsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x7d,0x0f,0x51,0x94,0x87,0x23,0x01,0x00,0x00] - vsqrtnepbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] + vsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291] -// CHECK: vsqrtnepbf16 xmm2, word ptr [eax]{1to8} +// CHECK: vsqrtbf16 xmm2, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x7d,0x18,0x51,0x10] - vsqrtnepbf16 xmm2, word ptr [eax]{1to8} + vsqrtbf16 xmm2, word ptr [eax]{1to8} -// CHECK: vsqrtnepbf16 xmm2, xmmword ptr [2*ebp - 512] +// CHECK: vsqrtbf16 xmm2, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x7d,0x08,0x51,0x14,0x6d,0x00,0xfe,0xff,0xff] - vsqrtnepbf16 xmm2, xmmword ptr [2*ebp - 512] + vsqrtbf16 xmm2, xmmword ptr [2*ebp - 512] -// CHECK: vsqrtnepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] +// CHECK: vsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x7d,0x8f,0x51,0x51,0x7f] - vsqrtnepbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] + vsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032] -// CHECK: vsqrtnepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} +// CHECK: vsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x7d,0x9f,0x51,0x52,0x80] - vsqrtnepbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} + vsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8} -// CHECK: vsqrtnepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vsqrtbf16 
ymm2, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x94,0xf4,0x00,0x00,0x00,0x10] - vsqrtnepbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] + vsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vsqrtnepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] +// CHECK: vsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x7d,0x2f,0x51,0x94,0x87,0x23,0x01,0x00,0x00] - vsqrtnepbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] + vsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291] -// CHECK: vsqrtnepbf16 ymm2, word ptr [eax]{1to16} +// CHECK: vsqrtbf16 ymm2, word ptr [eax]{1to16} // CHECK: encoding: [0x62,0xf5,0x7d,0x38,0x51,0x10] - vsqrtnepbf16 ymm2, word ptr [eax]{1to16} + vsqrtbf16 ymm2, word ptr [eax]{1to16} -// CHECK: vsqrtnepbf16 ymm2, ymmword ptr [2*ebp - 1024] +// CHECK: vsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x7d,0x28,0x51,0x14,0x6d,0x00,0xfc,0xff,0xff] - vsqrtnepbf16 ymm2, ymmword ptr [2*ebp - 1024] + vsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024] -// CHECK: vsqrtnepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] +// CHECK: vsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x7d,0xaf,0x51,0x51,0x7f] - vsqrtnepbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] + vsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064] -// CHECK: vsqrtnepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} +// CHECK: vsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x7d,0xbf,0x51,0x52,0x80] - vsqrtnepbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} + vsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16} -// CHECK: vsqrtnepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x94,0xf4,0x00,0x00,0x00,0x10] - vsqrtnepbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] + vsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: 
vsqrtnepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] +// CHECK: vsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x7d,0x4f,0x51,0x94,0x87,0x23,0x01,0x00,0x00] - vsqrtnepbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] + vsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291] -// CHECK: vsqrtnepbf16 zmm2, word ptr [eax]{1to32} +// CHECK: vsqrtbf16 zmm2, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x7d,0x58,0x51,0x10] - vsqrtnepbf16 zmm2, word ptr [eax]{1to32} + vsqrtbf16 zmm2, word ptr [eax]{1to32} -// CHECK: vsqrtnepbf16 zmm2, zmmword ptr [2*ebp - 2048] +// CHECK: vsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x7d,0x48,0x51,0x14,0x6d,0x00,0xf8,0xff,0xff] - vsqrtnepbf16 zmm2, zmmword ptr [2*ebp - 2048] + vsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048] -// CHECK: vsqrtnepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] +// CHECK: vsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x7d,0xcf,0x51,0x51,0x7f] - vsqrtnepbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] + vsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128] -// CHECK: vsqrtnepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} +// CHECK: vsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x7d,0xdf,0x51,0x52,0x80] - vsqrtnepbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} + vsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32} -// CHECK: vsubnepbf16 ymm2, ymm3, ymm4 +// CHECK: vsubbf16 ymm2, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0xd4] - vsubnepbf16 ymm2, ymm3, ymm4 + vsubbf16 ymm2, ymm3, ymm4 -// CHECK: vsubnepbf16 ymm2 {k7}, ymm3, ymm4 +// CHECK: vsubbf16 ymm2 {k7}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0xd4] - vsubnepbf16 ymm2 {k7}, ymm3, ymm4 + vsubbf16 ymm2 {k7}, ymm3, ymm4 -// CHECK: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymm4 +// CHECK: vsubbf16 ymm2 {k7} {z}, ymm3, ymm4 // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0xd4] - vsubnepbf16 ymm2 {k7} {z}, ymm3, ymm4 
+ vsubbf16 ymm2 {k7} {z}, ymm3, ymm4 -// CHECK: vsubnepbf16 zmm2, zmm3, zmm4 +// CHECK: vsubbf16 zmm2, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0xd4] - vsubnepbf16 zmm2, zmm3, zmm4 + vsubbf16 zmm2, zmm3, zmm4 -// CHECK: vsubnepbf16 zmm2 {k7}, zmm3, zmm4 +// CHECK: vsubbf16 zmm2 {k7}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0xd4] - vsubnepbf16 zmm2 {k7}, zmm3, zmm4 + vsubbf16 zmm2 {k7}, zmm3, zmm4 -// CHECK: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmm4 +// CHECK: vsubbf16 zmm2 {k7} {z}, zmm3, zmm4 // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0xd4] - vsubnepbf16 zmm2 {k7} {z}, zmm3, zmm4 + vsubbf16 zmm2 {k7} {z}, zmm3, zmm4 -// CHECK: vsubnepbf16 xmm2, xmm3, xmm4 +// CHECK: vsubbf16 xmm2, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0xd4] - vsubnepbf16 xmm2, xmm3, xmm4 + vsubbf16 xmm2, xmm3, xmm4 -// CHECK: vsubnepbf16 xmm2 {k7}, xmm3, xmm4 +// CHECK: vsubbf16 xmm2 {k7}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0xd4] - vsubnepbf16 xmm2 {k7}, xmm3, xmm4 + vsubbf16 xmm2 {k7}, xmm3, xmm4 -// CHECK: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmm4 +// CHECK: vsubbf16 xmm2 {k7} {z}, xmm3, xmm4 // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0xd4] - vsubnepbf16 xmm2 {k7} {z}, xmm3, xmm4 + vsubbf16 xmm2 {k7} {z}, xmm3, xmm4 -// CHECK: vsubnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] +// CHECK: vsubbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10] - vsubnepbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] + vsubbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456] -// CHECK: vsubnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] +// CHECK: vsubbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x4f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00] - vsubnepbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] + vsubbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291] -// CHECK: vsubnepbf16 zmm2, zmm3, 
word ptr [eax]{1to32} +// CHECK: vsubbf16 zmm2, zmm3, word ptr [eax]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0x58,0x5c,0x10] - vsubnepbf16 zmm2, zmm3, word ptr [eax]{1to32} + vsubbf16 zmm2, zmm3, word ptr [eax]{1to32} -// CHECK: vsubnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] +// CHECK: vsubbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] // CHECK: encoding: [0x62,0xf5,0x65,0x48,0x5c,0x14,0x6d,0x00,0xf8,0xff,0xff] - vsubnepbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] + vsubbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048] -// CHECK: vsubnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] +// CHECK: vsubbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] // CHECK: encoding: [0x62,0xf5,0x65,0xcf,0x5c,0x51,0x7f] - vsubnepbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] + vsubbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128] -// CHECK: vsubnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} +// CHECK: vsubbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} // CHECK: encoding: [0x62,0xf5,0x65,0xdf,0x5c,0x52,0x80] - vsubnepbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} + vsubbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32} -// CHECK: vsubnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] +// CHECK: vsubbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10] - vsubnepbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] + vsubbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456] -// CHECK: vsubnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] +// CHECK: vsubbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x2f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00] - vsubnepbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] + vsubbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291] -// CHECK: vsubnepbf16 ymm2, ymm3, word ptr [eax]{1to16} +// CHECK: vsubbf16 ymm2, ymm3, word ptr [eax]{1to16} // CHECK: encoding: 
[0x62,0xf5,0x65,0x38,0x5c,0x10] - vsubnepbf16 ymm2, ymm3, word ptr [eax]{1to16} + vsubbf16 ymm2, ymm3, word ptr [eax]{1to16} -// CHECK: vsubnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] +// CHECK: vsubbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] // CHECK: encoding: [0x62,0xf5,0x65,0x28,0x5c,0x14,0x6d,0x00,0xfc,0xff,0xff] - vsubnepbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] + vsubbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024] -// CHECK: vsubnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] +// CHECK: vsubbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] // CHECK: encoding: [0x62,0xf5,0x65,0xaf,0x5c,0x51,0x7f] - vsubnepbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] + vsubbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064] -// CHECK: vsubnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} +// CHECK: vsubbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} // CHECK: encoding: [0x62,0xf5,0x65,0xbf,0x5c,0x52,0x80] - vsubnepbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} + vsubbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16} -// CHECK: vsubnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] +// CHECK: vsubbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10] - vsubnepbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] + vsubbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456] -// CHECK: vsubnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] +// CHECK: vsubbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] // CHECK: encoding: [0x62,0xf5,0x65,0x0f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00] - vsubnepbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] + vsubbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291] -// CHECK: vsubnepbf16 xmm2, xmm3, word ptr [eax]{1to8} +// CHECK: vsubbf16 xmm2, xmm3, word ptr [eax]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x18,0x5c,0x10] - vsubnepbf16 xmm2, xmm3, word ptr [eax]{1to8} + vsubbf16 xmm2, xmm3, word ptr [eax]{1to8} -// 
CHECK: vsubnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] +// CHECK: vsubbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] // CHECK: encoding: [0x62,0xf5,0x65,0x08,0x5c,0x14,0x6d,0x00,0xfe,0xff,0xff] - vsubnepbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] + vsubbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512] -// CHECK: vsubnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] +// CHECK: vsubbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] // CHECK: encoding: [0x62,0xf5,0x65,0x8f,0x5c,0x51,0x7f] - vsubnepbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] + vsubbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032] -// CHECK: vsubnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} +// CHECK: vsubbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} // CHECK: encoding: [0x62,0xf5,0x65,0x9f,0x5c,0x52,0x80] - vsubnepbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} + vsubbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8} diff --git a/llvm/test/MC/X86/avx10.2-bf16-64-att.s b/llvm/test/MC/X86/avx10.2-bf16-64-att.s index 85d99cfe0a704..d960dca940c80 100644 --- a/llvm/test/MC/X86/avx10.2-bf16-64-att.s +++ b/llvm/test/MC/X86/avx10.2-bf16-64-att.s @@ -1,208 +1,208 @@ // RUN: llvm-mc -triple x86_64 --show-encoding %s | FileCheck %s -// CHECK: vaddnepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vaddbf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x58,0xf0] - vaddnepbf16 %ymm24, %ymm23, %ymm22 + vaddbf16 %ymm24, %ymm23, %ymm22 -// CHECK: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x27,0x58,0xf0] - vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x58,0xf0] - vaddnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vaddbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vaddnepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vaddbf16 
%zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x58,0xf0] - vaddnepbf16 %zmm24, %zmm23, %zmm22 + vaddbf16 %zmm24, %zmm23, %zmm22 -// CHECK: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x47,0x58,0xf0] - vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x58,0xf0] - vaddnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vaddbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vaddnepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vaddbf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x58,0xf0] - vaddnepbf16 %xmm24, %xmm23, %xmm22 + vaddbf16 %xmm24, %xmm23, %xmm22 -// CHECK: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x07,0x58,0xf0] - vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0x87,0x58,0xf0] - vaddnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vaddbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vaddnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vaddbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10] - vaddnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vaddbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vaddnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vaddbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x58,0xb4,0x80,0x23,0x01,0x00,0x00] - vaddnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vaddbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vaddnepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: 
vaddbf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x58,0x35,0x00,0x00,0x00,0x00] - vaddnepbf16 (%rip){1to32}, %zmm23, %zmm22 + vaddbf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vaddnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vaddbf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x58,0x34,0x6d,0x00,0xf8,0xff,0xff] - vaddnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vaddbf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vaddnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vaddbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x58,0x71,0x7f] - vaddnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vaddbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vaddnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vaddbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x58,0x72,0x80] - vaddnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vaddbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vaddnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vaddbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10] - vaddnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vaddbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vaddnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vaddbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x58,0xb4,0x80,0x23,0x01,0x00,0x00] - vaddnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vaddbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vaddnepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vaddbf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x58,0x35,0x00,0x00,0x00,0x00] - vaddnepbf16 (%rip){1to16}, %ymm23, %ymm22 + vaddbf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vaddnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vaddbf16 -1024(,%rbp,2), %ymm23, 
%ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x58,0x34,0x6d,0x00,0xfc,0xff,0xff] - vaddnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vaddbf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vaddnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vaddbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x58,0x71,0x7f] - vaddnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vaddbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vaddnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vaddbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x58,0x72,0x80] - vaddnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vaddbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vaddnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vaddbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10] - vaddnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vaddbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vaddnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vaddbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x58,0xb4,0x80,0x23,0x01,0x00,0x00] - vaddnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vaddbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vaddnepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vaddbf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x58,0x35,0x00,0x00,0x00,0x00] - vaddnepbf16 (%rip){1to8}, %xmm23, %xmm22 + vaddbf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vaddnepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vaddbf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x58,0x34,0x6d,0x00,0xfe,0xff,0xff] - vaddnepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vaddbf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vaddnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vaddbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: 
encoding: [0x62,0xe5,0x45,0x87,0x58,0x71,0x7f] - vaddnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vaddbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vaddnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vaddbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x58,0x72,0x80] - vaddnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vaddbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vcmppbf16 $123, %ymm24, %ymm23, %k5 +// CHECK: vcmpbf16 $123, %ymm24, %ymm23, %k5 // CHECK: encoding: [0x62,0x93,0x47,0x20,0xc2,0xe8,0x7b] - vcmppbf16 $123, %ymm24, %ymm23, %k5 + vcmpbf16 $123, %ymm24, %ymm23, %k5 -// CHECK: vcmppbf16 $123, %ymm24, %ymm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, %ymm24, %ymm23, %k5 {%k7} // CHECK: encoding: [0x62,0x93,0x47,0x27,0xc2,0xe8,0x7b] - vcmppbf16 $123, %ymm24, %ymm23, %k5 {%k7} + vcmpbf16 $123, %ymm24, %ymm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, %xmm24, %xmm23, %k5 +// CHECK: vcmpbf16 $123, %xmm24, %xmm23, %k5 // CHECK: encoding: [0x62,0x93,0x47,0x00,0xc2,0xe8,0x7b] - vcmppbf16 $123, %xmm24, %xmm23, %k5 + vcmpbf16 $123, %xmm24, %xmm23, %k5 -// CHECK: vcmppbf16 $123, %xmm24, %xmm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, %xmm24, %xmm23, %k5 {%k7} // CHECK: encoding: [0x62,0x93,0x47,0x07,0xc2,0xe8,0x7b] - vcmppbf16 $123, %xmm24, %xmm23, %k5 {%k7} + vcmpbf16 $123, %xmm24, %xmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, %zmm24, %zmm23, %k5 +// CHECK: vcmpbf16 $123, %zmm24, %zmm23, %k5 // CHECK: encoding: [0x62,0x93,0x47,0x40,0xc2,0xe8,0x7b] - vcmppbf16 $123, %zmm24, %zmm23, %k5 + vcmpbf16 $123, %zmm24, %zmm23, %k5 -// CHECK: vcmppbf16 $123, %zmm24, %zmm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, %zmm24, %zmm23, %k5 {%k7} // CHECK: encoding: [0x62,0x93,0x47,0x47,0xc2,0xe8,0x7b] - vcmppbf16 $123, %zmm24, %zmm23, %k5 {%k7} + vcmpbf16 $123, %zmm24, %zmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5 +// CHECK: vcmpbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5 // CHECK: 
encoding: [0x62,0xb3,0x47,0x40,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5 + vcmpbf16 $123, 268435456(%rbp,%r14,8), %zmm23, %k5 -// CHECK: vcmppbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xd3,0x47,0x47,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7} + vcmpbf16 $123, 291(%r8,%rax,4), %zmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, (%rip){1to32}, %zmm23, %k5 +// CHECK: vcmpbf16 $123, (%rip){1to32}, %zmm23, %k5 // CHECK: encoding: [0x62,0xf3,0x47,0x50,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b] - vcmppbf16 $123, (%rip){1to32}, %zmm23, %k5 + vcmpbf16 $123, (%rip){1to32}, %zmm23, %k5 -// CHECK: vcmppbf16 $123, -2048(,%rbp,2), %zmm23, %k5 +// CHECK: vcmpbf16 $123, -2048(,%rbp,2), %zmm23, %k5 // CHECK: encoding: [0x62,0xf3,0x47,0x40,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vcmppbf16 $123, -2048(,%rbp,2), %zmm23, %k5 + vcmpbf16 $123, -2048(,%rbp,2), %zmm23, %k5 -// CHECK: vcmppbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x47,0x47,0xc2,0x69,0x7f,0x7b] - vcmppbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7} + vcmpbf16 $123, 8128(%rcx), %zmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x47,0x57,0xc2,0x6a,0x80,0x7b] - vcmppbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7} + vcmpbf16 $123, -256(%rdx){1to32}, %zmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5 +// CHECK: vcmpbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5 // CHECK: encoding: [0x62,0xb3,0x47,0x00,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5 + vcmpbf16 $123, 268435456(%rbp,%r14,8), %xmm23, %k5 -// CHECK: vcmppbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7} +// CHECK: 
vcmpbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xd3,0x47,0x07,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7} + vcmpbf16 $123, 291(%r8,%rax,4), %xmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, (%rip){1to8}, %xmm23, %k5 +// CHECK: vcmpbf16 $123, (%rip){1to8}, %xmm23, %k5 // CHECK: encoding: [0x62,0xf3,0x47,0x10,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b] - vcmppbf16 $123, (%rip){1to8}, %xmm23, %k5 + vcmpbf16 $123, (%rip){1to8}, %xmm23, %k5 -// CHECK: vcmppbf16 $123, -512(,%rbp,2), %xmm23, %k5 +// CHECK: vcmpbf16 $123, -512(,%rbp,2), %xmm23, %k5 // CHECK: encoding: [0x62,0xf3,0x47,0x00,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vcmppbf16 $123, -512(,%rbp,2), %xmm23, %k5 + vcmpbf16 $123, -512(,%rbp,2), %xmm23, %k5 -// CHECK: vcmppbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x47,0x07,0xc2,0x69,0x7f,0x7b] - vcmppbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7} + vcmpbf16 $123, 2032(%rcx), %xmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x47,0x17,0xc2,0x6a,0x80,0x7b] - vcmppbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7} + vcmpbf16 $123, -256(%rdx){1to8}, %xmm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5 +// CHECK: vcmpbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5 // CHECK: encoding: [0x62,0xb3,0x47,0x20,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5 + vcmpbf16 $123, 268435456(%rbp,%r14,8), %ymm23, %k5 -// CHECK: vcmppbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7} // CHECK: encoding: [0x62,0xd3,0x47,0x27,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7} + vcmpbf16 $123, 291(%r8,%rax,4), %ymm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, 
(%rip){1to16}, %ymm23, %k5 +// CHECK: vcmpbf16 $123, (%rip){1to16}, %ymm23, %k5 // CHECK: encoding: [0x62,0xf3,0x47,0x30,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b] - vcmppbf16 $123, (%rip){1to16}, %ymm23, %k5 + vcmpbf16 $123, (%rip){1to16}, %ymm23, %k5 -// CHECK: vcmppbf16 $123, -1024(,%rbp,2), %ymm23, %k5 +// CHECK: vcmpbf16 $123, -1024(,%rbp,2), %ymm23, %k5 // CHECK: encoding: [0x62,0xf3,0x47,0x20,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vcmppbf16 $123, -1024(,%rbp,2), %ymm23, %k5 + vcmpbf16 $123, -1024(,%rbp,2), %ymm23, %k5 -// CHECK: vcmppbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x47,0x27,0xc2,0x69,0x7f,0x7b] - vcmppbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7} + vcmpbf16 $123, 4064(%rcx), %ymm23, %k5 {%k7} -// CHECK: vcmppbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7} +// CHECK: vcmpbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x47,0x37,0xc2,0x6a,0x80,0x7b] - vcmppbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7} + vcmpbf16 $123, -256(%rdx){1to16}, %ymm23, %k5 {%k7} // CHECK: vcomsbf16 %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x2f,0xf7] @@ -232,2783 +232,2783 @@ // CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x2f,0x72,0x80] vcomsbf16 -256(%rdx), %xmm22 -// CHECK: vdivnepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vdivbf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5e,0xf0] - vdivnepbf16 %ymm24, %ymm23, %ymm22 + vdivbf16 %ymm24, %ymm23, %ymm22 -// CHECK: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5e,0xf0] - vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5e,0xf0] - vdivnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vdivbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// 
CHECK: vdivnepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vdivbf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5e,0xf0] - vdivnepbf16 %zmm24, %zmm23, %zmm22 + vdivbf16 %zmm24, %zmm23, %zmm22 -// CHECK: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5e,0xf0] - vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5e,0xf0] - vdivnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vdivbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vdivnepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vdivbf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5e,0xf0] - vdivnepbf16 %xmm24, %xmm23, %xmm22 + vdivbf16 %xmm24, %xmm23, %xmm22 -// CHECK: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5e,0xf0] - vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5e,0xf0] - vdivnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vdivbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vdivnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vdivbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vdivnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vdivbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vdivnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vdivbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00] - vdivnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vdivbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// 
CHECK: vdivnepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vdivbf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5e,0x35,0x00,0x00,0x00,0x00] - vdivnepbf16 (%rip){1to32}, %zmm23, %zmm22 + vdivbf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vdivnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vdivbf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5e,0x34,0x6d,0x00,0xf8,0xff,0xff] - vdivnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vdivbf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vdivnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vdivbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5e,0x71,0x7f] - vdivnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vdivbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vdivnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vdivbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5e,0x72,0x80] - vdivnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vdivbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vdivnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vdivbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vdivnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vdivbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vdivnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vdivbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00] - vdivnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vdivbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vdivnepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vdivbf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5e,0x35,0x00,0x00,0x00,0x00] - vdivnepbf16 (%rip){1to16}, %ymm23, %ymm22 + vdivbf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vdivnepbf16 -1024(,%rbp,2), 
%ymm23, %ymm22 +// CHECK: vdivbf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5e,0x34,0x6d,0x00,0xfc,0xff,0xff] - vdivnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vdivbf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vdivnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vdivbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5e,0x71,0x7f] - vdivnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vdivbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vdivnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vdivbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5e,0x72,0x80] - vdivnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vdivbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vdivnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vdivbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vdivnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vdivbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vdivnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vdivbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00] - vdivnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vdivbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vdivnepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vdivbf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5e,0x35,0x00,0x00,0x00,0x00] - vdivnepbf16 (%rip){1to8}, %xmm23, %xmm22 + vdivbf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vdivnepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vdivbf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5e,0x34,0x6d,0x00,0xfe,0xff,0xff] - vdivnepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vdivbf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vdivnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: 
vdivbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5e,0x71,0x7f] - vdivnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vdivbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vdivnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vdivbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5e,0x72,0x80] - vdivnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vdivbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfmadd132bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x98,0xf0] - vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 + vfmadd132bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0x98,0xf0] - vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x98,0xf0] - vfmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfmadd132bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x98,0xf0] - vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 + vfmadd132bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0x98,0xf0] - vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x98,0xf0] - vfmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfmadd132bf16 %zmm24, 
%zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfmadd132bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x98,0xf0] - vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 + vfmadd132bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0x98,0xf0] - vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0x98,0xf0] - vfmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x98,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfmadd132bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x98,0x35,0x00,0x00,0x00,0x00] - vfmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfmadd132bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x98,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// 
CHECK: vfmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x98,0x71,0x7f] - vfmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x98,0x72,0x80] - vfmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x98,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfmadd132bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x98,0x35,0x00,0x00,0x00,0x00] - vfmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfmadd132bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x98,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: 
[0x62,0xe6,0x44,0xa7,0x98,0x71,0x7f] - vfmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x98,0x72,0x80] - vfmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x98,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfmadd132bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x98,0x35,0x00,0x00,0x00,0x00] - vfmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfmadd132bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x98,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x98,0x71,0x7f] - vfmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd132nepbf16 
-256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x98,0x72,0x80] - vfmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfmadd213bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xa8,0xf0] - vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 + vfmadd213bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xa8,0xf0] - vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xa8,0xf0] - vfmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfmadd213bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xa8,0xf0] - vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 + vfmadd213bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0xa8,0xf0] - vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xa8,0xf0] - vfmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfmadd213bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xa8,0xf0] - vfmadd213nepbf16 %xmm24, %xmm23, 
%xmm22 + vfmadd213bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xa8,0xf0] - vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xa8,0xf0] - vfmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfmadd213bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xa8,0x35,0x00,0x00,0x00,0x00] - vfmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfmadd213bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xa8,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xa8,0x71,0x7f] - vfmadd213nepbf16 8128(%rcx), 
%zmm23, %zmm22 {%k7} {z} + vfmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xa8,0x72,0x80] - vfmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfmadd213bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xa8,0x35,0x00,0x00,0x00,0x00] - vfmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfmadd213bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xa8,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xa8,0x71,0x7f] - vfmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd213bf16 
-256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xa8,0x72,0x80] - vfmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfmadd213bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xa8,0x35,0x00,0x00,0x00,0x00] - vfmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfmadd213bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xa8,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xa8,0x71,0x7f] - vfmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xa8,0x72,0x80] - vfmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfmadd213bf16 
-256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfmadd231bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xb8,0xf0] - vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 + vfmadd231bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xb8,0xf0] - vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xb8,0xf0] - vfmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfmadd231bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xb8,0xf0] - vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 + vfmadd231bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0xb8,0xf0] - vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xb8,0xf0] - vfmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfmadd231bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xb8,0xf0] - vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 + vfmadd231bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xb8,0xf0] - vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 
{%k7} + vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xb8,0xf0] - vfmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfmadd231bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xb8,0x35,0x00,0x00,0x00,0x00] - vfmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfmadd231bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xb8,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xb8,0x71,0x7f] - vfmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: 
[0x62,0xe6,0x44,0xd7,0xb8,0x72,0x80] - vfmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfmadd231bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xb8,0x35,0x00,0x00,0x00,0x00] - vfmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfmadd231bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xb8,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xb8,0x71,0x7f] - vfmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xb8,0x72,0x80] - vfmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: 
vfmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfmadd231bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xb8,0x35,0x00,0x00,0x00,0x00] - vfmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfmadd231bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xb8,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xb8,0x71,0x7f] - vfmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xb8,0x72,0x80] - vfmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfmsub132bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x9a,0xf0] - vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 + 
vfmsub132bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0x9a,0xf0] - vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9a,0xf0] - vfmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfmsub132bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x9a,0xf0] - vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 + vfmsub132bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0x9a,0xf0] - vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9a,0xf0] - vfmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfmsub132bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x9a,0xf0] - vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 + vfmsub132bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0x9a,0xf0] - vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0x9a,0xf0] - 
vfmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfmsub132bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9a,0x35,0x00,0x00,0x00,0x00] - vfmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfmsub132bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9a,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9a,0x71,0x7f] - vfmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9a,0x72,0x80] - vfmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: 
vfmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfmsub132bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9a,0x35,0x00,0x00,0x00,0x00] - vfmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfmsub132bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9a,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9a,0x71,0x7f] - vfmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9a,0x72,0x80] - vfmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 268435456(%rbp,%r14,8), 
%xmm23, %xmm22 + vfmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfmsub132bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9a,0x35,0x00,0x00,0x00,0x00] - vfmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfmsub132bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9a,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9a,0x71,0x7f] - vfmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9a,0x72,0x80] - vfmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfmsub213bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xaa,0xf0] - vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 + vfmsub213bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xaa,0xf0] - vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 
{%k7} + vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xaa,0xf0] - vfmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfmsub213bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xaa,0xf0] - vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 + vfmsub213bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0xaa,0xf0] - vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xaa,0xf0] - vfmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfmsub213bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xaa,0xf0] - vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 + vfmsub213bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xaa,0xf0] - vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xaa,0xf0] - vfmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: 
[0x62,0xa6,0x44,0x40,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfmsub213bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xaa,0x35,0x00,0x00,0x00,0x00] - vfmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfmsub213bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xaa,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xaa,0x71,0x7f] - vfmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xaa,0x72,0x80] - vfmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// 
CHECK: vfmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfmsub213bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xaa,0x35,0x00,0x00,0x00,0x00] - vfmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfmsub213bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xaa,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xaa,0x71,0x7f] - vfmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xaa,0x72,0x80] - vfmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: 
[0x62,0xc6,0x44,0x07,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfmsub213bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xaa,0x35,0x00,0x00,0x00,0x00] - vfmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfmsub213bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xaa,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xaa,0x71,0x7f] - vfmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xaa,0x72,0x80] - vfmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfmsub231bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xba,0xf0] - vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 + vfmsub231bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xba,0xf0] - vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xba,0xf0] - 
vfmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfmsub231bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xba,0xf0] - vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 + vfmsub231bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0xba,0xf0] - vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xba,0xf0] - vfmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfmsub231bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xba,0xf0] - vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 + vfmsub231bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xba,0xf0] - vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xba,0xf0] - vfmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 
{%k7} +// CHECK: vfmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xba,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfmsub231bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xba,0x35,0x00,0x00,0x00,0x00] - vfmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfmsub231bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xba,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xba,0x71,0x7f] - vfmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xba,0x72,0x80] - vfmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xba,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 
291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfmsub231bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xba,0x35,0x00,0x00,0x00,0x00] - vfmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfmsub231bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xba,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xba,0x71,0x7f] - vfmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xba,0x72,0x80] - vfmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xba,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfmsub231bf16 
(%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xba,0x35,0x00,0x00,0x00,0x00] - vfmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfmsub231bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xba,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xba,0x71,0x7f] - vfmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xba,0x72,0x80] - vfmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x9c,0xf0] - vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 + vfnmadd132bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0x9c,0xf0] - vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9c,0xf0] - vfnmadd132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfnmadd132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: 
[0x62,0x86,0x44,0x40,0x9c,0xf0] - vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 + vfnmadd132bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0x9c,0xf0] - vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9c,0xf0] - vfnmadd132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfnmadd132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x9c,0xf0] - vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 + vfnmadd132bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0x9c,0xf0] - vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0x9c,0xf0] - vfnmadd132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfnmadd132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfnmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfnmadd132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfnmadd132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfnmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 291(%r8,%rax,4), 
%zmm23, %zmm22 {%k7} + vfnmadd132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfnmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfnmadd132bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9c,0x35,0x00,0x00,0x00,0x00] - vfnmadd132nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfnmadd132bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfnmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfnmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfnmadd132bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfnmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9c,0x71,0x7f] - vfnmadd132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfnmadd132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9c,0x72,0x80] - vfnmadd132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfnmadd132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfnmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfnmadd132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfnmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfnmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfnmadd132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfnmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: 
vfnmadd132bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9c,0x35,0x00,0x00,0x00,0x00] - vfnmadd132nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfnmadd132bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfnmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfnmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfnmadd132bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfnmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9c,0x71,0x7f] - vfnmadd132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfnmadd132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9c,0x72,0x80] - vfnmadd132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfnmadd132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfnmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfnmadd132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfnmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfnmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfnmadd132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfnmadd132nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfnmadd132bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9c,0x35,0x00,0x00,0x00,0x00] - vfnmadd132nepbf16 (%rip){1to8}, 
%xmm23, %xmm22 + vfnmadd132bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfnmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfnmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfnmadd132bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfnmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9c,0x71,0x7f] - vfnmadd132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfnmadd132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9c,0x72,0x80] - vfnmadd132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfnmadd132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xac,0xf0] - vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 + vfnmadd213bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xac,0xf0] - vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xac,0xf0] - vfnmadd213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfnmadd213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xac,0xf0] - vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 + vfnmadd213bf16 %zmm24, %zmm23, %zmm22 -// CHECK: 
vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0xac,0xf0] - vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xac,0xf0] - vfnmadd213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfnmadd213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xac,0xf0] - vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 + vfnmadd213bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xac,0xf0] - vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xac,0xf0] - vfnmadd213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfnmadd213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfnmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfnmadd213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfnmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfnmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xac,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfnmadd213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfnmadd213nepbf16 (%rip){1to32}, %zmm23, 
%zmm22 +// CHECK: vfnmadd213bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xac,0x35,0x00,0x00,0x00,0x00] - vfnmadd213nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfnmadd213bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfnmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfnmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xac,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfnmadd213bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfnmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xac,0x71,0x7f] - vfnmadd213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfnmadd213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xac,0x72,0x80] - vfnmadd213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfnmadd213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfnmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfnmadd213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfnmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfnmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xac,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfnmadd213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfnmadd213nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfnmadd213bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xac,0x35,0x00,0x00,0x00,0x00] - vfnmadd213nepbf16 
(%rip){1to16}, %ymm23, %ymm22 + vfnmadd213bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfnmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfnmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xac,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfnmadd213bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfnmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xac,0x71,0x7f] - vfnmadd213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfnmadd213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xac,0x72,0x80] - vfnmadd213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfnmadd213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfnmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfnmadd213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfnmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfnmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xac,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfnmadd213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfnmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfnmadd213bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xac,0x35,0x00,0x00,0x00,0x00] - vfnmadd213nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfnmadd213bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfnmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: 
vfnmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xac,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfnmadd213bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfnmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xac,0x71,0x7f] - vfnmadd213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfnmadd213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xac,0x72,0x80] - vfnmadd213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfnmadd213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xbc,0xf0] - vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 + vfnmadd231bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xbc,0xf0] - vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbc,0xf0] - vfnmadd231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfnmadd231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xbc,0xf0] - vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 + vfnmadd231bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: 
[0x62,0x86,0x44,0x47,0xbc,0xf0] - vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbc,0xf0] - vfnmadd231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfnmadd231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xbc,0xf0] - vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 + vfnmadd231bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xbc,0xf0] - vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xbc,0xf0] - vfnmadd231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfnmadd231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfnmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfnmadd231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfnmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfnmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfnmadd231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfnmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfnmadd231bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: 
[0x62,0xe6,0x44,0x50,0xbc,0x35,0x00,0x00,0x00,0x00] - vfnmadd231nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfnmadd231bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfnmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfnmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbc,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfnmadd231bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfnmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbc,0x71,0x7f] - vfnmadd231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfnmadd231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbc,0x72,0x80] - vfnmadd231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfnmadd231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfnmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfnmadd231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfnmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfnmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfnmadd231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfnmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfnmadd231bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbc,0x35,0x00,0x00,0x00,0x00] - vfnmadd231nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfnmadd231bf16 (%rip){1to16}, %ymm23, %ymm22 -// 
CHECK: vfnmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfnmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbc,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfnmadd231bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfnmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbc,0x71,0x7f] - vfnmadd231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfnmadd231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbc,0x72,0x80] - vfnmadd231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfnmadd231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfnmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfnmadd231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfnmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfnmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfnmadd231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfnmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfnmadd231bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbc,0x35,0x00,0x00,0x00,0x00] - vfnmadd231nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfnmadd231bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfnmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfnmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: 
[0x62,0xe6,0x44,0x00,0xbc,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfnmadd231bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfnmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbc,0x71,0x7f] - vfnmadd231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfnmadd231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbc,0x72,0x80] - vfnmadd231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfnmadd231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x9e,0xf0] - vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 + vfnmsub132bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0x9e,0xf0] - vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9e,0xf0] - vfnmsub132nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfnmsub132bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x9e,0xf0] - vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 + vfnmsub132bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0x9e,0xf0] - vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + 
vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9e,0xf0] - vfnmsub132nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfnmsub132bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x9e,0xf0] - vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 + vfnmsub132bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0x9e,0xf0] - vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0x9e,0xf0] - vfnmsub132nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfnmsub132bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfnmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfnmsub132bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfnmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfnmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfnmsub132bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfnmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfnmsub132bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9e,0x35,0x00,0x00,0x00,0x00] - vfnmsub132nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfnmsub132bf16 
(%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfnmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfnmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9e,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub132nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfnmsub132bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfnmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9e,0x71,0x7f] - vfnmsub132nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfnmsub132bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9e,0x72,0x80] - vfnmsub132nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfnmsub132bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfnmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfnmsub132bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfnmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfnmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfnmsub132bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfnmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfnmsub132bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9e,0x35,0x00,0x00,0x00,0x00] - vfnmsub132nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfnmsub132bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfnmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfnmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22 // 
CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9e,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub132nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfnmsub132bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfnmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9e,0x71,0x7f] - vfnmsub132nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfnmsub132bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9e,0x72,0x80] - vfnmsub132nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfnmsub132bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfnmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfnmsub132bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfnmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfnmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfnmsub132bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfnmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfnmsub132bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9e,0x35,0x00,0x00,0x00,0x00] - vfnmsub132nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfnmsub132bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfnmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfnmsub132bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9e,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub132nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfnmsub132bf16 -512(,%rbp,2), 
%xmm23, %xmm22 -// CHECK: vfnmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9e,0x71,0x7f] - vfnmsub132nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfnmsub132bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9e,0x72,0x80] - vfnmsub132nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfnmsub132bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xae,0xf0] - vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 + vfnmsub213bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xae,0xf0] - vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xae,0xf0] - vfnmsub213nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfnmsub213bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xae,0xf0] - vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 + vfnmsub213bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0xae,0xf0] - vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub213bf16 %zmm24, 
%zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xae,0xf0] - vfnmsub213nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfnmsub213bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xae,0xf0] - vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 + vfnmsub213bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xae,0xf0] - vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xae,0xf0] - vfnmsub213nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfnmsub213bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfnmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfnmsub213bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfnmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfnmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xae,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfnmsub213bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfnmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfnmsub213bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xae,0x35,0x00,0x00,0x00,0x00] - vfnmsub213nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfnmsub213bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfnmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfnmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22 
// CHECK: encoding: [0x62,0xe6,0x44,0x40,0xae,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub213nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfnmsub213bf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfnmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xae,0x71,0x7f] - vfnmsub213nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfnmsub213bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xae,0x72,0x80] - vfnmsub213nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfnmsub213bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfnmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfnmsub213bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfnmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfnmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xae,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfnmsub213bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfnmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfnmsub213bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xae,0x35,0x00,0x00,0x00,0x00] - vfnmsub213nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfnmsub213bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfnmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfnmsub213bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xae,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub213nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfnmsub213bf16 
-1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfnmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xae,0x71,0x7f] - vfnmsub213nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfnmsub213bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xae,0x72,0x80] - vfnmsub213nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfnmsub213bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfnmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfnmsub213bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfnmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfnmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xae,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfnmsub213bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfnmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfnmsub213bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xae,0x35,0x00,0x00,0x00,0x00] - vfnmsub213nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfnmsub213bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfnmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfnmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xae,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub213nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfnmsub213bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfnmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // 
CHECK: encoding: [0x62,0xe6,0x44,0x87,0xae,0x71,0x7f] - vfnmsub213nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfnmsub213bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xae,0x72,0x80] - vfnmsub213nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfnmsub213bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xbe,0xf0] - vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 + vfnmsub231bf16 %ymm24, %ymm23, %ymm22 -// CHECK: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0xbe,0xf0] - vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbe,0xf0] - vfnmsub231nepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vfnmsub231bf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xbe,0xf0] - vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 + vfnmsub231bf16 %zmm24, %zmm23, %zmm22 -// CHECK: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0xbe,0xf0] - vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub231bf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbe,0xf0] - vfnmsub231nepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vfnmsub231bf16 
%zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xbe,0xf0] - vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 + vfnmsub231bf16 %xmm24, %xmm23, %xmm22 -// CHECK: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0xbe,0xf0] - vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0xbe,0xf0] - vfnmsub231nepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vfnmsub231bf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vfnmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vfnmsub231bf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vfnmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vfnmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vfnmsub231bf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vfnmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vfnmsub231bf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xbe,0x35,0x00,0x00,0x00,0x00] - vfnmsub231nepbf16 (%rip){1to32}, %zmm23, %zmm22 + vfnmsub231bf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vfnmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vfnmsub231bf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbe,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub231nepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vfnmsub231bf16 
-2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vfnmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbe,0x71,0x7f] - vfnmsub231nepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vfnmsub231bf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vfnmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbe,0x72,0x80] - vfnmsub231nepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vfnmsub231bf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vfnmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vfnmsub231bf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vfnmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vfnmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vfnmsub231bf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vfnmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vfnmsub231bf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbe,0x35,0x00,0x00,0x00,0x00] - vfnmsub231nepbf16 (%rip){1to16}, %ymm23, %ymm22 + vfnmsub231bf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vfnmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vfnmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbe,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub231nepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vfnmsub231bf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vfnmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub231bf16 4064(%rcx), %ymm23, %ymm22 
{%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbe,0x71,0x7f] - vfnmsub231nepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vfnmsub231bf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vfnmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbe,0x72,0x80] - vfnmsub231nepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vfnmsub231bf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vfnmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vfnmsub231bf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vfnmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vfnmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vfnmsub231bf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vfnmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vfnmsub231bf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbe,0x35,0x00,0x00,0x00,0x00] - vfnmsub231nepbf16 (%rip){1to8}, %xmm23, %xmm22 + vfnmsub231bf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vfnmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vfnmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xbe,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub231nepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vfnmsub231bf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vfnmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub231bf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbe,0x71,0x7f] - vfnmsub231nepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vfnmsub231bf16 2032(%rcx), %xmm23, 
%xmm22 {%k7} {z} -// CHECK: vfnmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vfnmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbe,0x72,0x80] - vfnmsub231nepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vfnmsub231bf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vfpclasspbf16 $123, %zmm23, %k5 +// CHECK: vfpclassbf16 $123, %zmm23, %k5 // CHECK: encoding: [0x62,0xb3,0x7f,0x48,0x66,0xef,0x7b] - vfpclasspbf16 $123, %zmm23, %k5 + vfpclassbf16 $123, %zmm23, %k5 -// CHECK: vfpclasspbf16 $123, %zmm23, %k5 {%k7} +// CHECK: vfpclassbf16 $123, %zmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xb3,0x7f,0x4f,0x66,0xef,0x7b] - vfpclasspbf16 $123, %zmm23, %k5 {%k7} + vfpclassbf16 $123, %zmm23, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, %ymm23, %k5 +// CHECK: vfpclassbf16 $123, %ymm23, %k5 // CHECK: encoding: [0x62,0xb3,0x7f,0x28,0x66,0xef,0x7b] - vfpclasspbf16 $123, %ymm23, %k5 + vfpclassbf16 $123, %ymm23, %k5 -// CHECK: vfpclasspbf16 $123, %ymm23, %k5 {%k7} +// CHECK: vfpclassbf16 $123, %ymm23, %k5 {%k7} // CHECK: encoding: [0x62,0xb3,0x7f,0x2f,0x66,0xef,0x7b] - vfpclasspbf16 $123, %ymm23, %k5 {%k7} + vfpclassbf16 $123, %ymm23, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, %xmm23, %k5 +// CHECK: vfpclassbf16 $123, %xmm23, %k5 // CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xef,0x7b] - vfpclasspbf16 $123, %xmm23, %k5 + vfpclassbf16 $123, %xmm23, %k5 -// CHECK: vfpclasspbf16 $123, %xmm23, %k5 {%k7} +// CHECK: vfpclassbf16 $123, %xmm23, %k5 {%k7} // CHECK: encoding: [0x62,0xb3,0x7f,0x0f,0x66,0xef,0x7b] - vfpclasspbf16 $123, %xmm23, %k5 {%k7} + vfpclassbf16 $123, %xmm23, %k5 {%k7} -// CHECK: vfpclasspbf16x $123, 268435456(%rbp,%r14,8), %k5 +// CHECK: vfpclassbf16x $123, 268435456(%rbp,%r14,8), %k5 // CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vfpclasspbf16x $123, 268435456(%rbp,%r14,8), %k5 + vfpclassbf16x $123, 268435456(%rbp,%r14,8), %k5 -// CHECK: vfpclasspbf16x $123, 
291(%r8,%rax,4), %k5 {%k7} +// CHECK: vfpclassbf16x $123, 291(%r8,%rax,4), %k5 {%k7} // CHECK: encoding: [0x62,0xd3,0x7f,0x0f,0x66,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - vfpclasspbf16x $123, 291(%r8,%rax,4), %k5 {%k7} + vfpclassbf16x $123, 291(%r8,%rax,4), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, (%rip){1to8}, %k5 +// CHECK: vfpclassbf16 $123, (%rip){1to8}, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b] - vfpclasspbf16 $123, (%rip){1to8}, %k5 + vfpclassbf16 $123, (%rip){1to8}, %k5 -// CHECK: vfpclasspbf16x $123, -512(,%rbp,2), %k5 +// CHECK: vfpclassbf16x $123, -512(,%rbp,2), %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vfpclasspbf16x $123, -512(,%rbp,2), %k5 + vfpclassbf16x $123, -512(,%rbp,2), %k5 -// CHECK: vfpclasspbf16x $123, 2032(%rcx), %k5 {%k7} +// CHECK: vfpclassbf16x $123, 2032(%rcx), %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16x $123, 2032(%rcx), %k5 {%k7} + vfpclassbf16x $123, 2032(%rcx), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, -256(%rdx){1to8}, %k5 {%k7} +// CHECK: vfpclassbf16 $123, -256(%rdx){1to8}, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 $123, -256(%rdx){1to8}, %k5 {%k7} + vfpclassbf16 $123, -256(%rdx){1to8}, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, (%rip){1to16}, %k5 +// CHECK: vfpclassbf16 $123, (%rip){1to16}, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b] - vfpclasspbf16 $123, (%rip){1to16}, %k5 + vfpclassbf16 $123, (%rip){1to16}, %k5 -// CHECK: vfpclasspbf16y $123, -1024(,%rbp,2), %k5 +// CHECK: vfpclassbf16y $123, -1024(,%rbp,2), %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vfpclasspbf16y $123, -1024(,%rbp,2), %k5 + vfpclassbf16y $123, -1024(,%rbp,2), %k5 -// CHECK: vfpclasspbf16y $123, 4064(%rcx), %k5 {%k7} +// CHECK: vfpclassbf16y $123, 4064(%rcx), %k5 {%k7} // CHECK: encoding: 
[0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16y $123, 4064(%rcx), %k5 {%k7} + vfpclassbf16y $123, 4064(%rcx), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, -256(%rdx){1to16}, %k5 {%k7} +// CHECK: vfpclassbf16 $123, -256(%rdx){1to16}, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 $123, -256(%rdx){1to16}, %k5 {%k7} + vfpclassbf16 $123, -256(%rdx){1to16}, %k5 {%k7} -// CHECK: vfpclasspbf16 $123, (%rip){1to32}, %k5 +// CHECK: vfpclassbf16 $123, (%rip){1to32}, %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b] - vfpclasspbf16 $123, (%rip){1to32}, %k5 + vfpclassbf16 $123, (%rip){1to32}, %k5 -// CHECK: vfpclasspbf16z $123, -2048(,%rbp,2), %k5 +// CHECK: vfpclassbf16z $123, -2048(,%rbp,2), %k5 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vfpclasspbf16z $123, -2048(,%rbp,2), %k5 + vfpclassbf16z $123, -2048(,%rbp,2), %k5 -// CHECK: vfpclasspbf16z $123, 8128(%rcx), %k5 {%k7} +// CHECK: vfpclassbf16z $123, 8128(%rcx), %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16z $123, 8128(%rcx), %k5 {%k7} + vfpclassbf16z $123, 8128(%rcx), %k5 {%k7} -// CHECK: vfpclasspbf16 $123, -256(%rdx){1to32}, %k5 {%k7} +// CHECK: vfpclassbf16 $123, -256(%rdx){1to32}, %k5 {%k7} // CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 $123, -256(%rdx){1to32}, %k5 {%k7} + vfpclassbf16 $123, -256(%rdx){1to32}, %k5 {%k7} -// CHECK: vgetexppbf16 %xmm23, %xmm22 +// CHECK: vgetexpbf16 %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xf7] - vgetexppbf16 %xmm23, %xmm22 + vgetexpbf16 %xmm23, %xmm22 -// CHECK: vgetexppbf16 %xmm23, %xmm22 {%k7} +// CHECK: vgetexpbf16 %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x42,0xf7] - vgetexppbf16 %xmm23, %xmm22 {%k7} + vgetexpbf16 %xmm23, %xmm22 {%k7} -// CHECK: vgetexppbf16 %xmm23, %xmm22 {%k7} {z} +// CHECK: vgetexpbf16 %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: 
[0x62,0xa5,0x7d,0x8f,0x42,0xf7] - vgetexppbf16 %xmm23, %xmm22 {%k7} {z} + vgetexpbf16 %xmm23, %xmm22 {%k7} {z} -// CHECK: vgetexppbf16 %zmm23, %zmm22 +// CHECK: vgetexpbf16 %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xf7] - vgetexppbf16 %zmm23, %zmm22 + vgetexpbf16 %zmm23, %zmm22 -// CHECK: vgetexppbf16 %zmm23, %zmm22 {%k7} +// CHECK: vgetexpbf16 %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x42,0xf7] - vgetexppbf16 %zmm23, %zmm22 {%k7} + vgetexpbf16 %zmm23, %zmm22 {%k7} -// CHECK: vgetexppbf16 %zmm23, %zmm22 {%k7} {z} +// CHECK: vgetexpbf16 %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x42,0xf7] - vgetexppbf16 %zmm23, %zmm22 {%k7} {z} + vgetexpbf16 %zmm23, %zmm22 {%k7} {z} -// CHECK: vgetexppbf16 %ymm23, %ymm22 +// CHECK: vgetexpbf16 %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xf7] - vgetexppbf16 %ymm23, %ymm22 + vgetexpbf16 %ymm23, %ymm22 -// CHECK: vgetexppbf16 %ymm23, %ymm22 {%k7} +// CHECK: vgetexpbf16 %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x42,0xf7] - vgetexppbf16 %ymm23, %ymm22 {%k7} + vgetexpbf16 %ymm23, %ymm22 {%k7} -// CHECK: vgetexppbf16 %ymm23, %ymm22 {%k7} {z} +// CHECK: vgetexpbf16 %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xa5,0x7d,0xaf,0x42,0xf7] - vgetexppbf16 %ymm23, %ymm22 {%k7} {z} + vgetexpbf16 %ymm23, %ymm22 {%k7} {z} -// CHECK: vgetexppbf16 268435456(%rbp,%r14,8), %xmm22 +// CHECK: vgetexpbf16 268435456(%rbp,%r14,8), %xmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10] - vgetexppbf16 268435456(%rbp,%r14,8), %xmm22 + vgetexpbf16 268435456(%rbp,%r14,8), %xmm22 -// CHECK: vgetexppbf16 291(%r8,%rax,4), %xmm22 {%k7} +// CHECK: vgetexpbf16 291(%r8,%rax,4), %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00] - vgetexppbf16 291(%r8,%rax,4), %xmm22 {%k7} + vgetexpbf16 291(%r8,%rax,4), %xmm22 {%k7} -// CHECK: vgetexppbf16 (%rip){1to8}, %xmm22 +// CHECK: vgetexpbf16 (%rip){1to8}, 
%xmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x42,0x35,0x00,0x00,0x00,0x00] - vgetexppbf16 (%rip){1to8}, %xmm22 + vgetexpbf16 (%rip){1to8}, %xmm22 -// CHECK: vgetexppbf16 -512(,%rbp,2), %xmm22 +// CHECK: vgetexpbf16 -512(,%rbp,2), %xmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x42,0x34,0x6d,0x00,0xfe,0xff,0xff] - vgetexppbf16 -512(,%rbp,2), %xmm22 + vgetexpbf16 -512(,%rbp,2), %xmm22 -// CHECK: vgetexppbf16 2032(%rcx), %xmm22 {%k7} {z} +// CHECK: vgetexpbf16 2032(%rcx), %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x42,0x71,0x7f] - vgetexppbf16 2032(%rcx), %xmm22 {%k7} {z} + vgetexpbf16 2032(%rcx), %xmm22 {%k7} {z} -// CHECK: vgetexppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} +// CHECK: vgetexpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x42,0x72,0x80] - vgetexppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} + vgetexpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -// CHECK: vgetexppbf16 268435456(%rbp,%r14,8), %ymm22 +// CHECK: vgetexpbf16 268435456(%rbp,%r14,8), %ymm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10] - vgetexppbf16 268435456(%rbp,%r14,8), %ymm22 + vgetexpbf16 268435456(%rbp,%r14,8), %ymm22 -// CHECK: vgetexppbf16 291(%r8,%rax,4), %ymm22 {%k7} +// CHECK: vgetexpbf16 291(%r8,%rax,4), %ymm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00] - vgetexppbf16 291(%r8,%rax,4), %ymm22 {%k7} + vgetexpbf16 291(%r8,%rax,4), %ymm22 {%k7} -// CHECK: vgetexppbf16 (%rip){1to16}, %ymm22 +// CHECK: vgetexpbf16 (%rip){1to16}, %ymm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x42,0x35,0x00,0x00,0x00,0x00] - vgetexppbf16 (%rip){1to16}, %ymm22 + vgetexpbf16 (%rip){1to16}, %ymm22 -// CHECK: vgetexppbf16 -1024(,%rbp,2), %ymm22 +// CHECK: vgetexpbf16 -1024(,%rbp,2), %ymm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x42,0x34,0x6d,0x00,0xfc,0xff,0xff] - vgetexppbf16 -1024(,%rbp,2), %ymm22 + vgetexpbf16 -1024(,%rbp,2), %ymm22 -// CHECK: vgetexppbf16 4064(%rcx), %ymm22 {%k7} {z} 
+// CHECK: vgetexpbf16 4064(%rcx), %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x42,0x71,0x7f] - vgetexppbf16 4064(%rcx), %ymm22 {%k7} {z} + vgetexpbf16 4064(%rcx), %ymm22 {%k7} {z} -// CHECK: vgetexppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +// CHECK: vgetexpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x42,0x72,0x80] - vgetexppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} + vgetexpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -// CHECK: vgetexppbf16 268435456(%rbp,%r14,8), %zmm22 +// CHECK: vgetexpbf16 268435456(%rbp,%r14,8), %zmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10] - vgetexppbf16 268435456(%rbp,%r14,8), %zmm22 + vgetexpbf16 268435456(%rbp,%r14,8), %zmm22 -// CHECK: vgetexppbf16 291(%r8,%rax,4), %zmm22 {%k7} +// CHECK: vgetexpbf16 291(%r8,%rax,4), %zmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00] - vgetexppbf16 291(%r8,%rax,4), %zmm22 {%k7} + vgetexpbf16 291(%r8,%rax,4), %zmm22 {%k7} -// CHECK: vgetexppbf16 (%rip){1to32}, %zmm22 +// CHECK: vgetexpbf16 (%rip){1to32}, %zmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x42,0x35,0x00,0x00,0x00,0x00] - vgetexppbf16 (%rip){1to32}, %zmm22 + vgetexpbf16 (%rip){1to32}, %zmm22 -// CHECK: vgetexppbf16 -2048(,%rbp,2), %zmm22 +// CHECK: vgetexpbf16 -2048(,%rbp,2), %zmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x48,0x42,0x34,0x6d,0x00,0xf8,0xff,0xff] - vgetexppbf16 -2048(,%rbp,2), %zmm22 + vgetexpbf16 -2048(,%rbp,2), %zmm22 -// CHECK: vgetexppbf16 8128(%rcx), %zmm22 {%k7} {z} +// CHECK: vgetexpbf16 8128(%rcx), %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x42,0x71,0x7f] - vgetexppbf16 8128(%rcx), %zmm22 {%k7} {z} + vgetexpbf16 8128(%rcx), %zmm22 {%k7} {z} -// CHECK: vgetexppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +// CHECK: vgetexpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x42,0x72,0x80] - vgetexppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} + vgetexpbf16 
-256(%rdx){1to32}, %zmm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, %zmm23, %zmm22 +// CHECK: vgetmantbf16 $123, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %zmm23, %zmm22 + vgetmantbf16 $123, %zmm23, %zmm22 -// CHECK: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} +// CHECK: vgetmantbf16 $123, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} + vgetmantbf16 $123, %zmm23, %zmm22 {%k7} -// CHECK: vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %zmm23, %zmm22 {%k7} {z} + vgetmantbf16 $123, %zmm23, %zmm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, %ymm23, %ymm22 +// CHECK: vgetmantbf16 $123, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %ymm23, %ymm22 + vgetmantbf16 $123, %ymm23, %ymm22 -// CHECK: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} +// CHECK: vgetmantbf16 $123, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} + vgetmantbf16 $123, %ymm23, %ymm22 {%k7} -// CHECK: vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %ymm23, %ymm22 {%k7} {z} + vgetmantbf16 $123, %ymm23, %ymm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, %xmm23, %xmm22 +// CHECK: vgetmantbf16 $123, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %xmm23, %xmm22 + vgetmantbf16 $123, %xmm23, %xmm22 -// CHECK: vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} +// CHECK: vgetmantbf16 $123, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} + vgetmantbf16 $123, %xmm23, %xmm22 {%k7} -// CHECK: vgetmantpbf16 $123, %xmm23, 
%xmm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x26,0xf7,0x7b] - vgetmantpbf16 $123, %xmm23, %xmm22 {%k7} {z} + vgetmantbf16 $123, %xmm23, %xmm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %xmm22 +// CHECK: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %xmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %xmm22 + vgetmantbf16 $123, 268435456(%rbp,%r14,8), %xmm22 -// CHECK: vgetmantpbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} +// CHECK: vgetmantbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} + vgetmantbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} -// CHECK: vgetmantpbf16 $123, (%rip){1to8}, %xmm22 +// CHECK: vgetmantbf16 $123, (%rip){1to8}, %xmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x26,0x35,0x00,0x00,0x00,0x00,0x7b] - vgetmantpbf16 $123, (%rip){1to8}, %xmm22 + vgetmantbf16 $123, (%rip){1to8}, %xmm22 -// CHECK: vgetmantpbf16 $123, -512(,%rbp,2), %xmm22 +// CHECK: vgetmantbf16 $123, -512(,%rbp,2), %xmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x26,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vgetmantpbf16 $123, -512(,%rbp,2), %xmm22 + vgetmantbf16 $123, -512(,%rbp,2), %xmm22 -// CHECK: vgetmantpbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x26,0x71,0x7f,0x7b] - vgetmantpbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} + vgetmantbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x26,0x72,0x80,0x7b] - vgetmantpbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} + vgetmantbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, 
268435456(%rbp,%r14,8), %ymm22 +// CHECK: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %ymm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %ymm22 + vgetmantbf16 $123, 268435456(%rbp,%r14,8), %ymm22 -// CHECK: vgetmantpbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} +// CHECK: vgetmantbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} + vgetmantbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} -// CHECK: vgetmantpbf16 $123, (%rip){1to16}, %ymm22 +// CHECK: vgetmantbf16 $123, (%rip){1to16}, %ymm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x26,0x35,0x00,0x00,0x00,0x00,0x7b] - vgetmantpbf16 $123, (%rip){1to16}, %ymm22 + vgetmantbf16 $123, (%rip){1to16}, %ymm22 -// CHECK: vgetmantpbf16 $123, -1024(,%rbp,2), %ymm22 +// CHECK: vgetmantbf16 $123, -1024(,%rbp,2), %ymm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x26,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vgetmantpbf16 $123, -1024(,%rbp,2), %ymm22 + vgetmantbf16 $123, -1024(,%rbp,2), %ymm22 -// CHECK: vgetmantpbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x26,0x71,0x7f,0x7b] - vgetmantpbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} + vgetmantbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x26,0x72,0x80,0x7b] - vgetmantpbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} + vgetmantbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %zmm22 +// CHECK: vgetmantbf16 $123, 268435456(%rbp,%r14,8), %zmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 $123, 268435456(%rbp,%r14,8), %zmm22 + vgetmantbf16 
$123, 268435456(%rbp,%r14,8), %zmm22 -// CHECK: vgetmantpbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} +// CHECK: vgetmantbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} + vgetmantbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} -// CHECK: vgetmantpbf16 $123, (%rip){1to32}, %zmm22 +// CHECK: vgetmantbf16 $123, (%rip){1to32}, %zmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x26,0x35,0x00,0x00,0x00,0x00,0x7b] - vgetmantpbf16 $123, (%rip){1to32}, %zmm22 + vgetmantbf16 $123, (%rip){1to32}, %zmm22 -// CHECK: vgetmantpbf16 $123, -2048(,%rbp,2), %zmm22 +// CHECK: vgetmantbf16 $123, -2048(,%rbp,2), %zmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x26,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vgetmantpbf16 $123, -2048(,%rbp,2), %zmm22 + vgetmantbf16 $123, -2048(,%rbp,2), %zmm22 -// CHECK: vgetmantpbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x26,0x71,0x7f,0x7b] - vgetmantpbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} + vgetmantbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} -// CHECK: vgetmantpbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} +// CHECK: vgetmantbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x26,0x72,0x80,0x7b] - vgetmantpbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} + vgetmantbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} -// CHECK: vmaxpbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vmaxbf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5f,0xf0] - vmaxpbf16 %ymm24, %ymm23, %ymm22 + vmaxbf16 %ymm24, %ymm23, %ymm22 -// CHECK: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5f,0xf0] - vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} + vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vmaxbf16 
%ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5f,0xf0] - vmaxpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vmaxbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vmaxpbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vmaxbf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5f,0xf0] - vmaxpbf16 %zmm24, %zmm23, %zmm22 + vmaxbf16 %zmm24, %zmm23, %zmm22 -// CHECK: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5f,0xf0] - vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} + vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5f,0xf0] - vmaxpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vmaxbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vmaxpbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vmaxbf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5f,0xf0] - vmaxpbf16 %xmm24, %xmm23, %xmm22 + vmaxbf16 %xmm24, %xmm23, %xmm22 -// CHECK: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5f,0xf0] - vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} + vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5f,0xf0] - vmaxpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vmaxbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vmaxpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vmaxbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmaxpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vmaxbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vmaxpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vmaxbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: 
[0x62,0xc5,0x45,0x47,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00] - vmaxpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vmaxbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vmaxpbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vmaxbf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5f,0x35,0x00,0x00,0x00,0x00] - vmaxpbf16 (%rip){1to32}, %zmm23, %zmm22 + vmaxbf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vmaxpbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vmaxbf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5f,0x34,0x6d,0x00,0xf8,0xff,0xff] - vmaxpbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vmaxbf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vmaxpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vmaxbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5f,0x71,0x7f] - vmaxpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vmaxbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vmaxpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vmaxbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5f,0x72,0x80] - vmaxpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vmaxbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vmaxpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vmaxbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmaxpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vmaxbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vmaxpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vmaxbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00] - vmaxpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vmaxbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vmaxpbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vmaxbf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: 
[0x62,0xe5,0x45,0x30,0x5f,0x35,0x00,0x00,0x00,0x00] - vmaxpbf16 (%rip){1to16}, %ymm23, %ymm22 + vmaxbf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vmaxpbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vmaxbf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5f,0x34,0x6d,0x00,0xfc,0xff,0xff] - vmaxpbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vmaxbf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vmaxpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vmaxbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5f,0x71,0x7f] - vmaxpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vmaxbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vmaxpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vmaxbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5f,0x72,0x80] - vmaxpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vmaxbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vmaxpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vmaxbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmaxpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vmaxbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vmaxpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vmaxbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00] - vmaxpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vmaxbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vmaxpbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vmaxbf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5f,0x35,0x00,0x00,0x00,0x00] - vmaxpbf16 (%rip){1to8}, %xmm23, %xmm22 + vmaxbf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vmaxpbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vmaxbf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5f,0x34,0x6d,0x00,0xfe,0xff,0xff] - vmaxpbf16 
-512(,%rbp,2), %xmm23, %xmm22 + vmaxbf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vmaxpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vmaxbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5f,0x71,0x7f] - vmaxpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vmaxbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vmaxpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vmaxbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5f,0x72,0x80] - vmaxpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vmaxbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vminpbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vminbf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5d,0xf0] - vminpbf16 %ymm24, %ymm23, %ymm22 + vminbf16 %ymm24, %ymm23, %ymm22 -// CHECK: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vminbf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5d,0xf0] - vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} + vminbf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vminbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5d,0xf0] - vminpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vminbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vminpbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vminbf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5d,0xf0] - vminpbf16 %zmm24, %zmm23, %zmm22 + vminbf16 %zmm24, %zmm23, %zmm22 -// CHECK: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vminbf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5d,0xf0] - vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} + vminbf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vminbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5d,0xf0] - vminpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vminbf16 %zmm24, %zmm23, %zmm22 
{%k7} {z} -// CHECK: vminpbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vminbf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5d,0xf0] - vminpbf16 %xmm24, %xmm23, %xmm22 + vminbf16 %xmm24, %xmm23, %xmm22 -// CHECK: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vminbf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5d,0xf0] - vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} + vminbf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vminbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5d,0xf0] - vminpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vminbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vminpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vminbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10] - vminpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vminbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vminpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vminbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00] - vminpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vminbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vminpbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vminbf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5d,0x35,0x00,0x00,0x00,0x00] - vminpbf16 (%rip){1to32}, %zmm23, %zmm22 + vminbf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vminpbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vminbf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5d,0x34,0x6d,0x00,0xf8,0xff,0xff] - vminpbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vminbf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vminpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vminbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5d,0x71,0x7f] - vminpbf16 
8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vminbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vminpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vminbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5d,0x72,0x80] - vminpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vminbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vminpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vminbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10] - vminpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vminbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vminpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vminbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00] - vminpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vminbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vminpbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vminbf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5d,0x35,0x00,0x00,0x00,0x00] - vminpbf16 (%rip){1to16}, %ymm23, %ymm22 + vminbf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vminpbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vminbf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5d,0x34,0x6d,0x00,0xfc,0xff,0xff] - vminpbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vminbf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vminpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vminbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5d,0x71,0x7f] - vminpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vminbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vminpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vminbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5d,0x72,0x80] - vminpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} 
{z} + vminbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vminpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vminbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10] - vminpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vminbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vminpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vminbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00] - vminpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vminbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vminpbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vminbf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5d,0x35,0x00,0x00,0x00,0x00] - vminpbf16 (%rip){1to8}, %xmm23, %xmm22 + vminbf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vminpbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vminbf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5d,0x34,0x6d,0x00,0xfe,0xff,0xff] - vminpbf16 -512(,%rbp,2), %xmm23, %xmm22 + vminbf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vminpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vminbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5d,0x71,0x7f] - vminpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vminbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vminpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vminbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5d,0x72,0x80] - vminpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vminbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vmulnepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vmulbf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x59,0xf0] - vmulnepbf16 %ymm24, %ymm23, %ymm22 + vmulbf16 %ymm24, %ymm23, %ymm22 -// CHECK: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: 
vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x27,0x59,0xf0] - vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x59,0xf0] - vmulnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vmulbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vmulnepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vmulbf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x59,0xf0] - vmulnepbf16 %zmm24, %zmm23, %zmm22 + vmulbf16 %zmm24, %zmm23, %zmm22 -// CHECK: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x47,0x59,0xf0] - vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x59,0xf0] - vmulnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vmulbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vmulnepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vmulbf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x59,0xf0] - vmulnepbf16 %xmm24, %xmm23, %xmm22 + vmulbf16 %xmm24, %xmm23, %xmm22 -// CHECK: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x07,0x59,0xf0] - vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0x87,0x59,0xf0] - vmulnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vmulbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vmulnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vmulbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: 
[0x62,0xa5,0x45,0x40,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmulnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vmulbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vmulnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vmulbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x59,0xb4,0x80,0x23,0x01,0x00,0x00] - vmulnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vmulbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vmulnepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vmulbf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x59,0x35,0x00,0x00,0x00,0x00] - vmulnepbf16 (%rip){1to32}, %zmm23, %zmm22 + vmulbf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vmulnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vmulbf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x59,0x34,0x6d,0x00,0xf8,0xff,0xff] - vmulnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vmulbf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vmulnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vmulbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x59,0x71,0x7f] - vmulnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vmulbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vmulnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vmulbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x59,0x72,0x80] - vmulnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vmulbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vmulnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vmulbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmulnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vmulbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vmulnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vmulbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: 
[0x62,0xc5,0x45,0x27,0x59,0xb4,0x80,0x23,0x01,0x00,0x00] - vmulnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vmulbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vmulnepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vmulbf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x59,0x35,0x00,0x00,0x00,0x00] - vmulnepbf16 (%rip){1to16}, %ymm23, %ymm22 + vmulbf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vmulnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vmulbf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x59,0x34,0x6d,0x00,0xfc,0xff,0xff] - vmulnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vmulbf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vmulnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vmulbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x59,0x71,0x7f] - vmulnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vmulbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vmulnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vmulbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x59,0x72,0x80] - vmulnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vmulbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vmulnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vmulbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmulnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vmulbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vmulnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vmulbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x59,0xb4,0x80,0x23,0x01,0x00,0x00] - vmulnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vmulbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vmulnepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vmulbf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: 
[0x62,0xe5,0x45,0x10,0x59,0x35,0x00,0x00,0x00,0x00] - vmulnepbf16 (%rip){1to8}, %xmm23, %xmm22 + vmulbf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vmulnepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vmulbf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x59,0x34,0x6d,0x00,0xfe,0xff,0xff] - vmulnepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vmulbf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vmulnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vmulbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x59,0x71,0x7f] - vmulnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vmulbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vmulnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vmulbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x59,0x72,0x80] - vmulnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vmulbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vrcppbf16 %xmm23, %xmm22 +// CHECK: vrcpbf16 %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xf7] - vrcppbf16 %xmm23, %xmm22 + vrcpbf16 %xmm23, %xmm22 -// CHECK: vrcppbf16 %xmm23, %xmm22 {%k7} +// CHECK: vrcpbf16 %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4c,0xf7] - vrcppbf16 %xmm23, %xmm22 {%k7} + vrcpbf16 %xmm23, %xmm22 {%k7} -// CHECK: vrcppbf16 %xmm23, %xmm22 {%k7} {z} +// CHECK: vrcpbf16 %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4c,0xf7] - vrcppbf16 %xmm23, %xmm22 {%k7} {z} + vrcpbf16 %xmm23, %xmm22 {%k7} {z} -// CHECK: vrcppbf16 %zmm23, %zmm22 +// CHECK: vrcpbf16 %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xf7] - vrcppbf16 %zmm23, %zmm22 + vrcpbf16 %zmm23, %zmm22 -// CHECK: vrcppbf16 %zmm23, %zmm22 {%k7} +// CHECK: vrcpbf16 %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4c,0xf7] - vrcppbf16 %zmm23, %zmm22 {%k7} + vrcpbf16 %zmm23, %zmm22 {%k7} -// CHECK: vrcppbf16 %zmm23, %zmm22 {%k7} {z} +// CHECK: 
vrcpbf16 %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4c,0xf7] - vrcppbf16 %zmm23, %zmm22 {%k7} {z} + vrcpbf16 %zmm23, %zmm22 {%k7} {z} -// CHECK: vrcppbf16 %ymm23, %ymm22 +// CHECK: vrcpbf16 %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xf7] - vrcppbf16 %ymm23, %ymm22 + vrcpbf16 %ymm23, %ymm22 -// CHECK: vrcppbf16 %ymm23, %ymm22 {%k7} +// CHECK: vrcpbf16 %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4c,0xf7] - vrcppbf16 %ymm23, %ymm22 {%k7} + vrcpbf16 %ymm23, %ymm22 {%k7} -// CHECK: vrcppbf16 %ymm23, %ymm22 {%k7} {z} +// CHECK: vrcpbf16 %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4c,0xf7] - vrcppbf16 %ymm23, %ymm22 {%k7} {z} + vrcpbf16 %ymm23, %ymm22 {%k7} {z} -// CHECK: vrcppbf16 268435456(%rbp,%r14,8), %xmm22 +// CHECK: vrcpbf16 268435456(%rbp,%r14,8), %xmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrcppbf16 268435456(%rbp,%r14,8), %xmm22 + vrcpbf16 268435456(%rbp,%r14,8), %xmm22 -// CHECK: vrcppbf16 291(%r8,%rax,4), %xmm22 {%k7} +// CHECK: vrcpbf16 291(%r8,%rax,4), %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00] - vrcppbf16 291(%r8,%rax,4), %xmm22 {%k7} + vrcpbf16 291(%r8,%rax,4), %xmm22 {%k7} -// CHECK: vrcppbf16 (%rip){1to8}, %xmm22 +// CHECK: vrcpbf16 (%rip){1to8}, %xmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4c,0x35,0x00,0x00,0x00,0x00] - vrcppbf16 (%rip){1to8}, %xmm22 + vrcpbf16 (%rip){1to8}, %xmm22 -// CHECK: vrcppbf16 -512(,%rbp,2), %xmm22 +// CHECK: vrcpbf16 -512(,%rbp,2), %xmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x08,0x4c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vrcppbf16 -512(,%rbp,2), %xmm22 + vrcpbf16 -512(,%rbp,2), %xmm22 -// CHECK: vrcppbf16 2032(%rcx), %xmm22 {%k7} {z} +// CHECK: vrcpbf16 2032(%rcx), %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4c,0x71,0x7f] - vrcppbf16 2032(%rcx), %xmm22 {%k7} {z} + vrcpbf16 2032(%rcx), %xmm22 {%k7} {z} -// CHECK: vrcppbf16 
-256(%rdx){1to8}, %xmm22 {%k7} {z} +// CHECK: vrcpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4c,0x72,0x80] - vrcppbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} + vrcpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -// CHECK: vrcppbf16 268435456(%rbp,%r14,8), %ymm22 +// CHECK: vrcpbf16 268435456(%rbp,%r14,8), %ymm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrcppbf16 268435456(%rbp,%r14,8), %ymm22 + vrcpbf16 268435456(%rbp,%r14,8), %ymm22 -// CHECK: vrcppbf16 291(%r8,%rax,4), %ymm22 {%k7} +// CHECK: vrcpbf16 291(%r8,%rax,4), %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00] - vrcppbf16 291(%r8,%rax,4), %ymm22 {%k7} + vrcpbf16 291(%r8,%rax,4), %ymm22 {%k7} -// CHECK: vrcppbf16 (%rip){1to16}, %ymm22 +// CHECK: vrcpbf16 (%rip){1to16}, %ymm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4c,0x35,0x00,0x00,0x00,0x00] - vrcppbf16 (%rip){1to16}, %ymm22 + vrcpbf16 (%rip){1to16}, %ymm22 -// CHECK: vrcppbf16 -1024(,%rbp,2), %ymm22 +// CHECK: vrcpbf16 -1024(,%rbp,2), %ymm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vrcppbf16 -1024(,%rbp,2), %ymm22 + vrcpbf16 -1024(,%rbp,2), %ymm22 -// CHECK: vrcppbf16 4064(%rcx), %ymm22 {%k7} {z} +// CHECK: vrcpbf16 4064(%rcx), %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4c,0x71,0x7f] - vrcppbf16 4064(%rcx), %ymm22 {%k7} {z} + vrcpbf16 4064(%rcx), %ymm22 {%k7} {z} -// CHECK: vrcppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +// CHECK: vrcpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4c,0x72,0x80] - vrcppbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} + vrcpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -// CHECK: vrcppbf16 268435456(%rbp,%r14,8), %zmm22 +// CHECK: vrcpbf16 268435456(%rbp,%r14,8), %zmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrcppbf16 268435456(%rbp,%r14,8), %zmm22 + vrcpbf16 268435456(%rbp,%r14,8), %zmm22 -// 
CHECK: vrcppbf16 291(%r8,%rax,4), %zmm22 {%k7} +// CHECK: vrcpbf16 291(%r8,%rax,4), %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00] - vrcppbf16 291(%r8,%rax,4), %zmm22 {%k7} + vrcpbf16 291(%r8,%rax,4), %zmm22 {%k7} -// CHECK: vrcppbf16 (%rip){1to32}, %zmm22 +// CHECK: vrcpbf16 (%rip){1to32}, %zmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4c,0x35,0x00,0x00,0x00,0x00] - vrcppbf16 (%rip){1to32}, %zmm22 + vrcpbf16 (%rip){1to32}, %zmm22 -// CHECK: vrcppbf16 -2048(,%rbp,2), %zmm22 +// CHECK: vrcpbf16 -2048(,%rbp,2), %zmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vrcppbf16 -2048(,%rbp,2), %zmm22 + vrcpbf16 -2048(,%rbp,2), %zmm22 -// CHECK: vrcppbf16 8128(%rcx), %zmm22 {%k7} {z} +// CHECK: vrcpbf16 8128(%rcx), %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4c,0x71,0x7f] - vrcppbf16 8128(%rcx), %zmm22 {%k7} {z} + vrcpbf16 8128(%rcx), %zmm22 {%k7} {z} -// CHECK: vrcppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +// CHECK: vrcpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4c,0x72,0x80] - vrcppbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} + vrcpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, %zmm23, %zmm22 +// CHECK: vreducebf16 $123, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xf7,0x7b] - vreducenepbf16 $123, %zmm23, %zmm22 + vreducebf16 $123, %zmm23, %zmm22 -// CHECK: vreducenepbf16 $123, %zmm23, %zmm22 {%k7} +// CHECK: vreducebf16 $123, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x56,0xf7,0x7b] - vreducenepbf16 $123, %zmm23, %zmm22 {%k7} + vreducebf16 $123, %zmm23, %zmm22 {%k7} -// CHECK: vreducenepbf16 $123, %zmm23, %zmm22 {%k7} {z} +// CHECK: vreducebf16 $123, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x56,0xf7,0x7b] - vreducenepbf16 $123, %zmm23, %zmm22 {%k7} {z} + vreducebf16 $123, %zmm23, %zmm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, %ymm23, %ymm22 +// 
CHECK: vreducebf16 $123, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xf7,0x7b] - vreducenepbf16 $123, %ymm23, %ymm22 + vreducebf16 $123, %ymm23, %ymm22 -// CHECK: vreducenepbf16 $123, %ymm23, %ymm22 {%k7} +// CHECK: vreducebf16 $123, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x56,0xf7,0x7b] - vreducenepbf16 $123, %ymm23, %ymm22 {%k7} + vreducebf16 $123, %ymm23, %ymm22 {%k7} -// CHECK: vreducenepbf16 $123, %ymm23, %ymm22 {%k7} {z} +// CHECK: vreducebf16 $123, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x56,0xf7,0x7b] - vreducenepbf16 $123, %ymm23, %ymm22 {%k7} {z} + vreducebf16 $123, %ymm23, %ymm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, %xmm23, %xmm22 +// CHECK: vreducebf16 $123, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xf7,0x7b] - vreducenepbf16 $123, %xmm23, %xmm22 + vreducebf16 $123, %xmm23, %xmm22 -// CHECK: vreducenepbf16 $123, %xmm23, %xmm22 {%k7} +// CHECK: vreducebf16 $123, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x56,0xf7,0x7b] - vreducenepbf16 $123, %xmm23, %xmm22 {%k7} + vreducebf16 $123, %xmm23, %xmm22 {%k7} -// CHECK: vreducenepbf16 $123, %xmm23, %xmm22 {%k7} {z} +// CHECK: vreducebf16 $123, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x56,0xf7,0x7b] - vreducenepbf16 $123, %xmm23, %xmm22 {%k7} {z} + vreducebf16 $123, %xmm23, %xmm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22 +// CHECK: vreducebf16 $123, 268435456(%rbp,%r14,8), %xmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22 + vreducebf16 $123, 268435456(%rbp,%r14,8), %xmm22 -// CHECK: vreducenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} +// CHECK: vreducebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} + vreducebf16 $123, 
291(%r8,%rax,4), %xmm22 {%k7} -// CHECK: vreducenepbf16 $123, (%rip){1to8}, %xmm22 +// CHECK: vreducebf16 $123, (%rip){1to8}, %xmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x56,0x35,0x00,0x00,0x00,0x00,0x7b] - vreducenepbf16 $123, (%rip){1to8}, %xmm22 + vreducebf16 $123, (%rip){1to8}, %xmm22 -// CHECK: vreducenepbf16 $123, -512(,%rbp,2), %xmm22 +// CHECK: vreducebf16 $123, -512(,%rbp,2), %xmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x56,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vreducenepbf16 $123, -512(,%rbp,2), %xmm22 + vreducebf16 $123, -512(,%rbp,2), %xmm22 -// CHECK: vreducenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} +// CHECK: vreducebf16 $123, 2032(%rcx), %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x56,0x71,0x7f,0x7b] - vreducenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} + vreducebf16 $123, 2032(%rcx), %xmm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} +// CHECK: vreducebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x56,0x72,0x80,0x7b] - vreducenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} + vreducebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22 +// CHECK: vreducebf16 $123, 268435456(%rbp,%r14,8), %ymm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22 + vreducebf16 $123, 268435456(%rbp,%r14,8), %ymm22 -// CHECK: vreducenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} +// CHECK: vreducebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} + vreducebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} -// CHECK: vreducenepbf16 $123, (%rip){1to16}, %ymm22 +// CHECK: vreducebf16 $123, (%rip){1to16}, %ymm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x56,0x35,0x00,0x00,0x00,0x00,0x7b] - vreducenepbf16 $123, (%rip){1to16}, %ymm22 
+ vreducebf16 $123, (%rip){1to16}, %ymm22 -// CHECK: vreducenepbf16 $123, -1024(,%rbp,2), %ymm22 +// CHECK: vreducebf16 $123, -1024(,%rbp,2), %ymm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x56,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vreducenepbf16 $123, -1024(,%rbp,2), %ymm22 + vreducebf16 $123, -1024(,%rbp,2), %ymm22 -// CHECK: vreducenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} +// CHECK: vreducebf16 $123, 4064(%rcx), %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x56,0x71,0x7f,0x7b] - vreducenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} + vreducebf16 $123, 4064(%rcx), %ymm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} +// CHECK: vreducebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x56,0x72,0x80,0x7b] - vreducenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} + vreducebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22 +// CHECK: vreducebf16 $123, 268435456(%rbp,%r14,8), %zmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22 + vreducebf16 $123, 268435456(%rbp,%r14,8), %zmm22 -// CHECK: vreducenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} +// CHECK: vreducebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} + vreducebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} -// CHECK: vreducenepbf16 $123, (%rip){1to32}, %zmm22 +// CHECK: vreducebf16 $123, (%rip){1to32}, %zmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x56,0x35,0x00,0x00,0x00,0x00,0x7b] - vreducenepbf16 $123, (%rip){1to32}, %zmm22 + vreducebf16 $123, (%rip){1to32}, %zmm22 -// CHECK: vreducenepbf16 $123, -2048(,%rbp,2), %zmm22 +// CHECK: vreducebf16 $123, -2048(,%rbp,2), %zmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x56,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b] - 
vreducenepbf16 $123, -2048(,%rbp,2), %zmm22 + vreducebf16 $123, -2048(,%rbp,2), %zmm22 -// CHECK: vreducenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} +// CHECK: vreducebf16 $123, 8128(%rcx), %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x56,0x71,0x7f,0x7b] - vreducenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} + vreducebf16 $123, 8128(%rcx), %zmm22 {%k7} {z} -// CHECK: vreducenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} +// CHECK: vreducebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x56,0x72,0x80,0x7b] - vreducenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} + vreducebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, %zmm23, %zmm22 +// CHECK: vrndscalebf16 $123, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %zmm23, %zmm22 + vrndscalebf16 $123, %zmm23, %zmm22 -// CHECK: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} +// CHECK: vrndscalebf16 $123, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} + vrndscalebf16 $123, %zmm23, %zmm22 {%k7} -// CHECK: vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %zmm23, %zmm22 {%k7} {z} + vrndscalebf16 $123, %zmm23, %zmm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, %ymm23, %ymm22 +// CHECK: vrndscalebf16 $123, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %ymm23, %ymm22 + vrndscalebf16 $123, %ymm23, %ymm22 -// CHECK: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} +// CHECK: vrndscalebf16 $123, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} + vrndscalebf16 $123, %ymm23, %ymm22 {%k7} -// CHECK: vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} {z} +// CHECK: vrndscalebf16 
$123, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %ymm23, %ymm22 {%k7} {z} + vrndscalebf16 $123, %ymm23, %ymm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, %xmm23, %xmm22 +// CHECK: vrndscalebf16 $123, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %xmm23, %xmm22 + vrndscalebf16 $123, %xmm23, %xmm22 -// CHECK: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} +// CHECK: vrndscalebf16 $123, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} + vrndscalebf16 $123, %xmm23, %xmm22 {%k7} -// CHECK: vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x08,0xf7,0x7b] - vrndscalenepbf16 $123, %xmm23, %xmm22 {%k7} {z} + vrndscalebf16 $123, %xmm23, %xmm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22 +// CHECK: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %xmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %xmm22 + vrndscalebf16 $123, 268435456(%rbp,%r14,8), %xmm22 -// CHECK: vrndscalenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} +// CHECK: vrndscalebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} + vrndscalebf16 $123, 291(%r8,%rax,4), %xmm22 {%k7} -// CHECK: vrndscalenepbf16 $123, (%rip){1to8}, %xmm22 +// CHECK: vrndscalebf16 $123, (%rip){1to8}, %xmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x08,0x35,0x00,0x00,0x00,0x00,0x7b] - vrndscalenepbf16 $123, (%rip){1to8}, %xmm22 + vrndscalebf16 $123, (%rip){1to8}, %xmm22 -// CHECK: vrndscalenepbf16 $123, -512(,%rbp,2), %xmm22 +// CHECK: vrndscalebf16 $123, -512(,%rbp,2), %xmm22 // CHECK: encoding: 
[0x62,0xe3,0x7f,0x08,0x08,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vrndscalenepbf16 $123, -512(,%rbp,2), %xmm22 + vrndscalebf16 $123, -512(,%rbp,2), %xmm22 -// CHECK: vrndscalenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, 2032(%rcx), %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x08,0x71,0x7f,0x7b] - vrndscalenepbf16 $123, 2032(%rcx), %xmm22 {%k7} {z} + vrndscalebf16 $123, 2032(%rcx), %xmm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x08,0x72,0x80,0x7b] - vrndscalenepbf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} + vrndscalebf16 $123, -256(%rdx){1to8}, %xmm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22 +// CHECK: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %ymm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %ymm22 + vrndscalebf16 $123, 268435456(%rbp,%r14,8), %ymm22 -// CHECK: vrndscalenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} +// CHECK: vrndscalebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} + vrndscalebf16 $123, 291(%r8,%rax,4), %ymm22 {%k7} -// CHECK: vrndscalenepbf16 $123, (%rip){1to16}, %ymm22 +// CHECK: vrndscalebf16 $123, (%rip){1to16}, %ymm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x08,0x35,0x00,0x00,0x00,0x00,0x7b] - vrndscalenepbf16 $123, (%rip){1to16}, %ymm22 + vrndscalebf16 $123, (%rip){1to16}, %ymm22 -// CHECK: vrndscalenepbf16 $123, -1024(,%rbp,2), %ymm22 +// CHECK: vrndscalebf16 $123, -1024(,%rbp,2), %ymm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x08,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vrndscalenepbf16 $123, -1024(,%rbp,2), %ymm22 + vrndscalebf16 $123, -1024(,%rbp,2), %ymm22 -// CHECK: vrndscalenepbf16 $123, 4064(%rcx), 
%ymm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, 4064(%rcx), %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x08,0x71,0x7f,0x7b] - vrndscalenepbf16 $123, 4064(%rcx), %ymm22 {%k7} {z} + vrndscalebf16 $123, 4064(%rcx), %ymm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x08,0x72,0x80,0x7b] - vrndscalenepbf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} + vrndscalebf16 $123, -256(%rdx){1to16}, %ymm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22 +// CHECK: vrndscalebf16 $123, 268435456(%rbp,%r14,8), %zmm22 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 $123, 268435456(%rbp,%r14,8), %zmm22 + vrndscalebf16 $123, 268435456(%rbp,%r14,8), %zmm22 -// CHECK: vrndscalenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} +// CHECK: vrndscalebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} // CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} + vrndscalebf16 $123, 291(%r8,%rax,4), %zmm22 {%k7} -// CHECK: vrndscalenepbf16 $123, (%rip){1to32}, %zmm22 +// CHECK: vrndscalebf16 $123, (%rip){1to32}, %zmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x08,0x35,0x00,0x00,0x00,0x00,0x7b] - vrndscalenepbf16 $123, (%rip){1to32}, %zmm22 + vrndscalebf16 $123, (%rip){1to32}, %zmm22 -// CHECK: vrndscalenepbf16 $123, -2048(,%rbp,2), %zmm22 +// CHECK: vrndscalebf16 $123, -2048(,%rbp,2), %zmm22 // CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x08,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vrndscalenepbf16 $123, -2048(,%rbp,2), %zmm22 + vrndscalebf16 $123, -2048(,%rbp,2), %zmm22 -// CHECK: vrndscalenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, 8128(%rcx), %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x08,0x71,0x7f,0x7b] - vrndscalenepbf16 $123, 8128(%rcx), %zmm22 {%k7} {z} + 
vrndscalebf16 $123, 8128(%rcx), %zmm22 {%k7} {z} -// CHECK: vrndscalenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} +// CHECK: vrndscalebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x08,0x72,0x80,0x7b] - vrndscalenepbf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} + vrndscalebf16 $123, -256(%rdx){1to32}, %zmm22 {%k7} {z} -// CHECK: vrsqrtpbf16 %xmm23, %xmm22 +// CHECK: vrsqrtbf16 %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xf7] - vrsqrtpbf16 %xmm23, %xmm22 + vrsqrtbf16 %xmm23, %xmm22 -// CHECK: vrsqrtpbf16 %xmm23, %xmm22 {%k7} +// CHECK: vrsqrtbf16 %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4e,0xf7] - vrsqrtpbf16 %xmm23, %xmm22 {%k7} + vrsqrtbf16 %xmm23, %xmm22 {%k7} -// CHECK: vrsqrtpbf16 %xmm23, %xmm22 {%k7} {z} +// CHECK: vrsqrtbf16 %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4e,0xf7] - vrsqrtpbf16 %xmm23, %xmm22 {%k7} {z} + vrsqrtbf16 %xmm23, %xmm22 {%k7} {z} -// CHECK: vrsqrtpbf16 %zmm23, %zmm22 +// CHECK: vrsqrtbf16 %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xf7] - vrsqrtpbf16 %zmm23, %zmm22 + vrsqrtbf16 %zmm23, %zmm22 -// CHECK: vrsqrtpbf16 %zmm23, %zmm22 {%k7} +// CHECK: vrsqrtbf16 %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4e,0xf7] - vrsqrtpbf16 %zmm23, %zmm22 {%k7} + vrsqrtbf16 %zmm23, %zmm22 {%k7} -// CHECK: vrsqrtpbf16 %zmm23, %zmm22 {%k7} {z} +// CHECK: vrsqrtbf16 %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4e,0xf7] - vrsqrtpbf16 %zmm23, %zmm22 {%k7} {z} + vrsqrtbf16 %zmm23, %zmm22 {%k7} {z} -// CHECK: vrsqrtpbf16 %ymm23, %ymm22 +// CHECK: vrsqrtbf16 %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xf7] - vrsqrtpbf16 %ymm23, %ymm22 + vrsqrtbf16 %ymm23, %ymm22 -// CHECK: vrsqrtpbf16 %ymm23, %ymm22 {%k7} +// CHECK: vrsqrtbf16 %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4e,0xf7] - vrsqrtpbf16 %ymm23, %ymm22 {%k7} + vrsqrtbf16 %ymm23, %ymm22 {%k7} -// 
CHECK: vrsqrtpbf16 %ymm23, %ymm22 {%k7} {z} +// CHECK: vrsqrtbf16 %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4e,0xf7] - vrsqrtpbf16 %ymm23, %ymm22 {%k7} {z} + vrsqrtbf16 %ymm23, %ymm22 {%k7} {z} -// CHECK: vrsqrtpbf16 268435456(%rbp,%r14,8), %xmm22 +// CHECK: vrsqrtbf16 268435456(%rbp,%r14,8), %xmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrsqrtpbf16 268435456(%rbp,%r14,8), %xmm22 + vrsqrtbf16 268435456(%rbp,%r14,8), %xmm22 -// CHECK: vrsqrtpbf16 291(%r8,%rax,4), %xmm22 {%k7} +// CHECK: vrsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00] - vrsqrtpbf16 291(%r8,%rax,4), %xmm22 {%k7} + vrsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7} -// CHECK: vrsqrtpbf16 (%rip){1to8}, %xmm22 +// CHECK: vrsqrtbf16 (%rip){1to8}, %xmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4e,0x35,0x00,0x00,0x00,0x00] - vrsqrtpbf16 (%rip){1to8}, %xmm22 + vrsqrtbf16 (%rip){1to8}, %xmm22 -// CHECK: vrsqrtpbf16 -512(,%rbp,2), %xmm22 +// CHECK: vrsqrtbf16 -512(,%rbp,2), %xmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x08,0x4e,0x34,0x6d,0x00,0xfe,0xff,0xff] - vrsqrtpbf16 -512(,%rbp,2), %xmm22 + vrsqrtbf16 -512(,%rbp,2), %xmm22 -// CHECK: vrsqrtpbf16 2032(%rcx), %xmm22 {%k7} {z} +// CHECK: vrsqrtbf16 2032(%rcx), %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4e,0x71,0x7f] - vrsqrtpbf16 2032(%rcx), %xmm22 {%k7} {z} + vrsqrtbf16 2032(%rcx), %xmm22 {%k7} {z} -// CHECK: vrsqrtpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} +// CHECK: vrsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4e,0x72,0x80] - vrsqrtpbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} + vrsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -// CHECK: vrsqrtpbf16 268435456(%rbp,%r14,8), %ymm22 +// CHECK: vrsqrtbf16 268435456(%rbp,%r14,8), %ymm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrsqrtpbf16 268435456(%rbp,%r14,8), %ymm22 + vrsqrtbf16 
268435456(%rbp,%r14,8), %ymm22 -// CHECK: vrsqrtpbf16 291(%r8,%rax,4), %ymm22 {%k7} +// CHECK: vrsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00] - vrsqrtpbf16 291(%r8,%rax,4), %ymm22 {%k7} + vrsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7} -// CHECK: vrsqrtpbf16 (%rip){1to16}, %ymm22 +// CHECK: vrsqrtbf16 (%rip){1to16}, %ymm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4e,0x35,0x00,0x00,0x00,0x00] - vrsqrtpbf16 (%rip){1to16}, %ymm22 + vrsqrtbf16 (%rip){1to16}, %ymm22 -// CHECK: vrsqrtpbf16 -1024(,%rbp,2), %ymm22 +// CHECK: vrsqrtbf16 -1024(,%rbp,2), %ymm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4e,0x34,0x6d,0x00,0xfc,0xff,0xff] - vrsqrtpbf16 -1024(,%rbp,2), %ymm22 + vrsqrtbf16 -1024(,%rbp,2), %ymm22 -// CHECK: vrsqrtpbf16 4064(%rcx), %ymm22 {%k7} {z} +// CHECK: vrsqrtbf16 4064(%rcx), %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4e,0x71,0x7f] - vrsqrtpbf16 4064(%rcx), %ymm22 {%k7} {z} + vrsqrtbf16 4064(%rcx), %ymm22 {%k7} {z} -// CHECK: vrsqrtpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +// CHECK: vrsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4e,0x72,0x80] - vrsqrtpbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} + vrsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -// CHECK: vrsqrtpbf16 268435456(%rbp,%r14,8), %zmm22 +// CHECK: vrsqrtbf16 268435456(%rbp,%r14,8), %zmm22 // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrsqrtpbf16 268435456(%rbp,%r14,8), %zmm22 + vrsqrtbf16 268435456(%rbp,%r14,8), %zmm22 -// CHECK: vrsqrtpbf16 291(%r8,%rax,4), %zmm22 {%k7} +// CHECK: vrsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00] - vrsqrtpbf16 291(%r8,%rax,4), %zmm22 {%k7} + vrsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7} -// CHECK: vrsqrtpbf16 (%rip){1to32}, %zmm22 +// CHECK: vrsqrtbf16 (%rip){1to32}, %zmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4e,0x35,0x00,0x00,0x00,0x00] - 
vrsqrtpbf16 (%rip){1to32}, %zmm22 + vrsqrtbf16 (%rip){1to32}, %zmm22 -// CHECK: vrsqrtpbf16 -2048(,%rbp,2), %zmm22 +// CHECK: vrsqrtbf16 -2048(,%rbp,2), %zmm22 // CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4e,0x34,0x6d,0x00,0xf8,0xff,0xff] - vrsqrtpbf16 -2048(,%rbp,2), %zmm22 + vrsqrtbf16 -2048(,%rbp,2), %zmm22 -// CHECK: vrsqrtpbf16 8128(%rcx), %zmm22 {%k7} {z} +// CHECK: vrsqrtbf16 8128(%rcx), %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4e,0x71,0x7f] - vrsqrtpbf16 8128(%rcx), %zmm22 {%k7} {z} + vrsqrtbf16 8128(%rcx), %zmm22 {%k7} {z} -// CHECK: vrsqrtpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +// CHECK: vrsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4e,0x72,0x80] - vrsqrtpbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} + vrsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} -// CHECK: vscalefpbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vscalefbf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x2c,0xf0] - vscalefpbf16 %ymm24, %ymm23, %ymm22 + vscalefbf16 %ymm24, %ymm23, %ymm22 -// CHECK: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x27,0x2c,0xf0] - vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} + vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x2c,0xf0] - vscalefpbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vscalefbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vscalefpbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vscalefbf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x2c,0xf0] - vscalefpbf16 %zmm24, %zmm23, %zmm22 + vscalefbf16 %zmm24, %zmm23, %zmm22 -// CHECK: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x47,0x2c,0xf0] - vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} + vscalefbf16 %zmm24, 
%zmm23, %zmm22 {%k7} -// CHECK: vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x2c,0xf0] - vscalefpbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vscalefbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vscalefpbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vscalefbf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x2c,0xf0] - vscalefpbf16 %xmm24, %xmm23, %xmm22 + vscalefbf16 %xmm24, %xmm23, %xmm22 -// CHECK: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x86,0x44,0x07,0x2c,0xf0] - vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} + vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x86,0x44,0x87,0x2c,0xf0] - vscalefpbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vscalefbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vscalefpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vscalefbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vscalefpbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vscalefbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vscalefpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vscalefbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00] - vscalefpbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vscalefbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vscalefpbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vscalefbf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x2c,0x35,0x00,0x00,0x00,0x00] - vscalefpbf16 (%rip){1to32}, %zmm23, %zmm22 + vscalefbf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vscalefpbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vscalefbf16 -2048(,%rbp,2), %zmm23, %zmm22 // 
CHECK: encoding: [0x62,0xe6,0x44,0x40,0x2c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vscalefpbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vscalefbf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vscalefpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} +// CHECK: vscalefbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x2c,0x71,0x7f] - vscalefpbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vscalefbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vscalefpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vscalefbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x2c,0x72,0x80] - vscalefpbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vscalefbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vscalefpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vscalefbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vscalefpbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vscalefbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vscalefpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vscalefbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00] - vscalefpbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vscalefbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vscalefpbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vscalefbf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x2c,0x35,0x00,0x00,0x00,0x00] - vscalefpbf16 (%rip){1to16}, %ymm23, %ymm22 + vscalefbf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vscalefpbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vscalefbf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x2c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vscalefpbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vscalefbf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vscalefpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vscalefbf16 
4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x2c,0x71,0x7f] - vscalefpbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vscalefbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vscalefpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// CHECK: vscalefbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x2c,0x72,0x80] - vscalefpbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vscalefbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vscalefpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vscalefbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vscalefpbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vscalefbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vscalefpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vscalefbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00] - vscalefpbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vscalefbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vscalefpbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vscalefbf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x2c,0x35,0x00,0x00,0x00,0x00] - vscalefpbf16 (%rip){1to8}, %xmm23, %xmm22 + vscalefbf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vscalefpbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vscalefbf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x2c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vscalefpbf16 -512(,%rbp,2), %xmm23, %xmm22 + vscalefbf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vscalefpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vscalefbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x2c,0x71,0x7f] - vscalefpbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vscalefbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vscalefpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 
{%k7} {z} +// CHECK: vscalefbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x2c,0x72,0x80] - vscalefpbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vscalefbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} -// CHECK: vsqrtnepbf16 %xmm23, %xmm22 +// CHECK: vsqrtbf16 %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xf7] - vsqrtnepbf16 %xmm23, %xmm22 + vsqrtbf16 %xmm23, %xmm22 -// CHECK: vsqrtnepbf16 %xmm23, %xmm22 {%k7} +// CHECK: vsqrtbf16 %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x51,0xf7] - vsqrtnepbf16 %xmm23, %xmm22 {%k7} + vsqrtbf16 %xmm23, %xmm22 {%k7} -// CHECK: vsqrtnepbf16 %xmm23, %xmm22 {%k7} {z} +// CHECK: vsqrtbf16 %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa5,0x7d,0x8f,0x51,0xf7] - vsqrtnepbf16 %xmm23, %xmm22 {%k7} {z} + vsqrtbf16 %xmm23, %xmm22 {%k7} {z} -// CHECK: vsqrtnepbf16 %zmm23, %zmm22 +// CHECK: vsqrtbf16 %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xf7] - vsqrtnepbf16 %zmm23, %zmm22 + vsqrtbf16 %zmm23, %zmm22 -// CHECK: vsqrtnepbf16 %zmm23, %zmm22 {%k7} +// CHECK: vsqrtbf16 %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x51,0xf7] - vsqrtnepbf16 %zmm23, %zmm22 {%k7} + vsqrtbf16 %zmm23, %zmm22 {%k7} -// CHECK: vsqrtnepbf16 %zmm23, %zmm22 {%k7} {z} +// CHECK: vsqrtbf16 %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x51,0xf7] - vsqrtnepbf16 %zmm23, %zmm22 {%k7} {z} + vsqrtbf16 %zmm23, %zmm22 {%k7} {z} -// CHECK: vsqrtnepbf16 %ymm23, %ymm22 +// CHECK: vsqrtbf16 %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xf7] - vsqrtnepbf16 %ymm23, %ymm22 + vsqrtbf16 %ymm23, %ymm22 -// CHECK: vsqrtnepbf16 %ymm23, %ymm22 {%k7} +// CHECK: vsqrtbf16 %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x51,0xf7] - vsqrtnepbf16 %ymm23, %ymm22 {%k7} + vsqrtbf16 %ymm23, %ymm22 {%k7} -// CHECK: vsqrtnepbf16 %ymm23, %ymm22 {%k7} {z} +// CHECK: vsqrtbf16 %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: 
[0x62,0xa5,0x7d,0xaf,0x51,0xf7] - vsqrtnepbf16 %ymm23, %ymm22 {%k7} {z} + vsqrtbf16 %ymm23, %ymm22 {%k7} {z} -// CHECK: vsqrtnepbf16 268435456(%rbp,%r14,8), %xmm22 +// CHECK: vsqrtbf16 268435456(%rbp,%r14,8), %xmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsqrtnepbf16 268435456(%rbp,%r14,8), %xmm22 + vsqrtbf16 268435456(%rbp,%r14,8), %xmm22 -// CHECK: vsqrtnepbf16 291(%r8,%rax,4), %xmm22 {%k7} +// CHECK: vsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00] - vsqrtnepbf16 291(%r8,%rax,4), %xmm22 {%k7} + vsqrtbf16 291(%r8,%rax,4), %xmm22 {%k7} -// CHECK: vsqrtnepbf16 (%rip){1to8}, %xmm22 +// CHECK: vsqrtbf16 (%rip){1to8}, %xmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x51,0x35,0x00,0x00,0x00,0x00] - vsqrtnepbf16 (%rip){1to8}, %xmm22 + vsqrtbf16 (%rip){1to8}, %xmm22 -// CHECK: vsqrtnepbf16 -512(,%rbp,2), %xmm22 +// CHECK: vsqrtbf16 -512(,%rbp,2), %xmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x51,0x34,0x6d,0x00,0xfe,0xff,0xff] - vsqrtnepbf16 -512(,%rbp,2), %xmm22 + vsqrtbf16 -512(,%rbp,2), %xmm22 -// CHECK: vsqrtnepbf16 2032(%rcx), %xmm22 {%k7} {z} +// CHECK: vsqrtbf16 2032(%rcx), %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x51,0x71,0x7f] - vsqrtnepbf16 2032(%rcx), %xmm22 {%k7} {z} + vsqrtbf16 2032(%rcx), %xmm22 {%k7} {z} -// CHECK: vsqrtnepbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} +// CHECK: vsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x51,0x72,0x80] - vsqrtnepbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} + vsqrtbf16 -256(%rdx){1to8}, %xmm22 {%k7} {z} -// CHECK: vsqrtnepbf16 268435456(%rbp,%r14,8), %ymm22 +// CHECK: vsqrtbf16 268435456(%rbp,%r14,8), %ymm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsqrtnepbf16 268435456(%rbp,%r14,8), %ymm22 + vsqrtbf16 268435456(%rbp,%r14,8), %ymm22 -// CHECK: vsqrtnepbf16 291(%r8,%rax,4), %ymm22 {%k7} +// CHECK: vsqrtbf16 291(%r8,%rax,4), 
%ymm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00] - vsqrtnepbf16 291(%r8,%rax,4), %ymm22 {%k7} + vsqrtbf16 291(%r8,%rax,4), %ymm22 {%k7} -// CHECK: vsqrtnepbf16 (%rip){1to16}, %ymm22 +// CHECK: vsqrtbf16 (%rip){1to16}, %ymm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x51,0x35,0x00,0x00,0x00,0x00] - vsqrtnepbf16 (%rip){1to16}, %ymm22 + vsqrtbf16 (%rip){1to16}, %ymm22 -// CHECK: vsqrtnepbf16 -1024(,%rbp,2), %ymm22 +// CHECK: vsqrtbf16 -1024(,%rbp,2), %ymm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x51,0x34,0x6d,0x00,0xfc,0xff,0xff] - vsqrtnepbf16 -1024(,%rbp,2), %ymm22 + vsqrtbf16 -1024(,%rbp,2), %ymm22 -// CHECK: vsqrtnepbf16 4064(%rcx), %ymm22 {%k7} {z} +// CHECK: vsqrtbf16 4064(%rcx), %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x51,0x71,0x7f] - vsqrtnepbf16 4064(%rcx), %ymm22 {%k7} {z} + vsqrtbf16 4064(%rcx), %ymm22 {%k7} {z} -// CHECK: vsqrtnepbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} +// CHECK: vsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x51,0x72,0x80] - vsqrtnepbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} + vsqrtbf16 -256(%rdx){1to16}, %ymm22 {%k7} {z} -// CHECK: vsqrtnepbf16 268435456(%rbp,%r14,8), %zmm22 +// CHECK: vsqrtbf16 268435456(%rbp,%r14,8), %zmm22 // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsqrtnepbf16 268435456(%rbp,%r14,8), %zmm22 + vsqrtbf16 268435456(%rbp,%r14,8), %zmm22 -// CHECK: vsqrtnepbf16 291(%r8,%rax,4), %zmm22 {%k7} +// CHECK: vsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00] - vsqrtnepbf16 291(%r8,%rax,4), %zmm22 {%k7} + vsqrtbf16 291(%r8,%rax,4), %zmm22 {%k7} -// CHECK: vsqrtnepbf16 (%rip){1to32}, %zmm22 +// CHECK: vsqrtbf16 (%rip){1to32}, %zmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x51,0x35,0x00,0x00,0x00,0x00] - vsqrtnepbf16 (%rip){1to32}, %zmm22 + vsqrtbf16 (%rip){1to32}, %zmm22 -// CHECK: vsqrtnepbf16 -2048(,%rbp,2), %zmm22 +// CHECK: 
vsqrtbf16 -2048(,%rbp,2), %zmm22 // CHECK: encoding: [0x62,0xe5,0x7d,0x48,0x51,0x34,0x6d,0x00,0xf8,0xff,0xff] - vsqrtnepbf16 -2048(,%rbp,2), %zmm22 + vsqrtbf16 -2048(,%rbp,2), %zmm22 -// CHECK: vsqrtnepbf16 8128(%rcx), %zmm22 {%k7} {z} +// CHECK: vsqrtbf16 8128(%rcx), %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x51,0x71,0x7f] - vsqrtnepbf16 8128(%rcx), %zmm22 {%k7} {z} + vsqrtbf16 8128(%rcx), %zmm22 {%k7} {z} -// CHECK: vsqrtnepbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} +// CHECK: vsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x51,0x72,0x80] - vsqrtnepbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} + vsqrtbf16 -256(%rdx){1to32}, %zmm22 {%k7} {z} -// CHECK: vsubnepbf16 %ymm24, %ymm23, %ymm22 +// CHECK: vsubbf16 %ymm24, %ymm23, %ymm22 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5c,0xf0] - vsubnepbf16 %ymm24, %ymm23, %ymm22 + vsubbf16 %ymm24, %ymm23, %ymm22 -// CHECK: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} +// CHECK: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5c,0xf0] - vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} + vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} -// CHECK: vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} +// CHECK: vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5c,0xf0] - vsubnepbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} + vsubbf16 %ymm24, %ymm23, %ymm22 {%k7} {z} -// CHECK: vsubnepbf16 %zmm24, %zmm23, %zmm22 +// CHECK: vsubbf16 %zmm24, %zmm23, %zmm22 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5c,0xf0] - vsubnepbf16 %zmm24, %zmm23, %zmm22 + vsubbf16 %zmm24, %zmm23, %zmm22 -// CHECK: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} +// CHECK: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5c,0xf0] - vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} + vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} -// CHECK: vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} +// CHECK: vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: 
[0x62,0x85,0x45,0xc7,0x5c,0xf0] - vsubnepbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} + vsubbf16 %zmm24, %zmm23, %zmm22 {%k7} {z} -// CHECK: vsubnepbf16 %xmm24, %xmm23, %xmm22 +// CHECK: vsubbf16 %xmm24, %xmm23, %xmm22 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5c,0xf0] - vsubnepbf16 %xmm24, %xmm23, %xmm22 + vsubbf16 %xmm24, %xmm23, %xmm22 -// CHECK: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} +// CHECK: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5c,0xf0] - vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} + vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} -// CHECK: vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} +// CHECK: vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5c,0xf0] - vsubnepbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} + vsubbf16 %xmm24, %xmm23, %xmm22 {%k7} {z} -// CHECK: vsubnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 +// CHECK: vsubbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsubnepbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 + vsubbf16 268435456(%rbp,%r14,8), %zmm23, %zmm22 -// CHECK: vsubnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} +// CHECK: vsubbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00] - vsubnepbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} + vsubbf16 291(%r8,%rax,4), %zmm23, %zmm22 {%k7} -// CHECK: vsubnepbf16 (%rip){1to32}, %zmm23, %zmm22 +// CHECK: vsubbf16 (%rip){1to32}, %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5c,0x35,0x00,0x00,0x00,0x00] - vsubnepbf16 (%rip){1to32}, %zmm23, %zmm22 + vsubbf16 (%rip){1to32}, %zmm23, %zmm22 -// CHECK: vsubnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 +// CHECK: vsubbf16 -2048(,%rbp,2), %zmm23, %zmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vsubnepbf16 -2048(,%rbp,2), %zmm23, %zmm22 + vsubbf16 -2048(,%rbp,2), %zmm23, %zmm22 -// CHECK: vsubnepbf16 8128(%rcx), %zmm23, %zmm22 
{%k7} {z} +// CHECK: vsubbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5c,0x71,0x7f] - vsubnepbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} + vsubbf16 8128(%rcx), %zmm23, %zmm22 {%k7} {z} -// CHECK: vsubnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} +// CHECK: vsubbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5c,0x72,0x80] - vsubnepbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} + vsubbf16 -256(%rdx){1to32}, %zmm23, %zmm22 {%k7} {z} -// CHECK: vsubnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 +// CHECK: vsubbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsubnepbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 + vsubbf16 268435456(%rbp,%r14,8), %ymm23, %ymm22 -// CHECK: vsubnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} +// CHECK: vsubbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00] - vsubnepbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} + vsubbf16 291(%r8,%rax,4), %ymm23, %ymm22 {%k7} -// CHECK: vsubnepbf16 (%rip){1to16}, %ymm23, %ymm22 +// CHECK: vsubbf16 (%rip){1to16}, %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5c,0x35,0x00,0x00,0x00,0x00] - vsubnepbf16 (%rip){1to16}, %ymm23, %ymm22 + vsubbf16 (%rip){1to16}, %ymm23, %ymm22 -// CHECK: vsubnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 +// CHECK: vsubbf16 -1024(,%rbp,2), %ymm23, %ymm22 // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vsubnepbf16 -1024(,%rbp,2), %ymm23, %ymm22 + vsubbf16 -1024(,%rbp,2), %ymm23, %ymm22 -// CHECK: vsubnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} +// CHECK: vsubbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5c,0x71,0x7f] - vsubnepbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} + vsubbf16 4064(%rcx), %ymm23, %ymm22 {%k7} {z} -// CHECK: vsubnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} +// 
CHECK: vsubbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5c,0x72,0x80] - vsubnepbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} + vsubbf16 -256(%rdx){1to16}, %ymm23, %ymm22 {%k7} {z} -// CHECK: vsubnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 +// CHECK: vsubbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsubnepbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 + vsubbf16 268435456(%rbp,%r14,8), %xmm23, %xmm22 -// CHECK: vsubnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} +// CHECK: vsubbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00] - vsubnepbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} + vsubbf16 291(%r8,%rax,4), %xmm23, %xmm22 {%k7} -// CHECK: vsubnepbf16 (%rip){1to8}, %xmm23, %xmm22 +// CHECK: vsubbf16 (%rip){1to8}, %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5c,0x35,0x00,0x00,0x00,0x00] - vsubnepbf16 (%rip){1to8}, %xmm23, %xmm22 + vsubbf16 (%rip){1to8}, %xmm23, %xmm22 -// CHECK: vsubnepbf16 -512(,%rbp,2), %xmm23, %xmm22 +// CHECK: vsubbf16 -512(,%rbp,2), %xmm23, %xmm22 // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vsubnepbf16 -512(,%rbp,2), %xmm23, %xmm22 + vsubbf16 -512(,%rbp,2), %xmm23, %xmm22 -// CHECK: vsubnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} +// CHECK: vsubbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5c,0x71,0x7f] - vsubnepbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} + vsubbf16 2032(%rcx), %xmm23, %xmm22 {%k7} {z} -// CHECK: vsubnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} +// CHECK: vsubbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5c,0x72,0x80] - vsubnepbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} + vsubbf16 -256(%rdx){1to8}, %xmm23, %xmm22 {%k7} {z} diff --git a/llvm/test/MC/X86/avx10.2-bf16-64-intel.s 
b/llvm/test/MC/X86/avx10.2-bf16-64-intel.s index 5f3dc45ba7745..a275979ad0a25 100644 --- a/llvm/test/MC/X86/avx10.2-bf16-64-intel.s +++ b/llvm/test/MC/X86/avx10.2-bf16-64-intel.s @@ -1,208 +1,208 @@ // RUN: llvm-mc -triple x86_64 -x86-asm-syntax=intel -output-asm-variant=1 --show-encoding %s | FileCheck %s -// CHECK: vaddnepbf16 ymm22, ymm23, ymm24 +// CHECK: vaddbf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x58,0xf0] - vaddnepbf16 ymm22, ymm23, ymm24 + vaddbf16 ymm22, ymm23, ymm24 -// CHECK: vaddnepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vaddbf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x27,0x58,0xf0] - vaddnepbf16 ymm22 {k7}, ymm23, ymm24 + vaddbf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vaddnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vaddbf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x58,0xf0] - vaddnepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vaddbf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vaddnepbf16 zmm22, zmm23, zmm24 +// CHECK: vaddbf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x58,0xf0] - vaddnepbf16 zmm22, zmm23, zmm24 + vaddbf16 zmm22, zmm23, zmm24 -// CHECK: vaddnepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vaddbf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x47,0x58,0xf0] - vaddnepbf16 zmm22 {k7}, zmm23, zmm24 + vaddbf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vaddbf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x58,0xf0] - vaddnepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vaddbf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vaddnepbf16 xmm22, xmm23, xmm24 +// CHECK: vaddbf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x58,0xf0] - vaddnepbf16 xmm22, xmm23, xmm24 + vaddbf16 xmm22, xmm23, xmm24 -// CHECK: vaddnepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vaddbf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x07,0x58,0xf0] - vaddnepbf16 xmm22 {k7}, xmm23, 
xmm24 + vaddbf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vaddbf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x87,0x58,0xf0] - vaddnepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vaddbf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vaddnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vaddbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10] - vaddnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vaddbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vaddnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vaddbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x58,0xb4,0x80,0x23,0x01,0x00,0x00] - vaddnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vaddbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vaddnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vaddbf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x58,0x35,0x00,0x00,0x00,0x00] - vaddnepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vaddbf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vaddnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vaddbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x58,0x34,0x6d,0x00,0xf8,0xff,0xff] - vaddnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vaddbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vaddnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vaddbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x58,0x71,0x7f] - vaddnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vaddbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vaddnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vaddbf16 zmm22 {k7} {z}, 
zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x58,0x72,0x80] - vaddnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vaddbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vaddnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vaddbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10] - vaddnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vaddbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vaddnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vaddbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x58,0xb4,0x80,0x23,0x01,0x00,0x00] - vaddnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vaddbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vaddnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vaddbf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x58,0x35,0x00,0x00,0x00,0x00] - vaddnepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vaddbf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vaddnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vaddbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x58,0x34,0x6d,0x00,0xfc,0xff,0xff] - vaddnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vaddbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vaddnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vaddbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x58,0x71,0x7f] - vaddnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vaddbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vaddnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vaddbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: 
[0x62,0xe5,0x45,0xb7,0x58,0x72,0x80] - vaddnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vaddbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vaddnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vaddbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x58,0xb4,0xf5,0x00,0x00,0x00,0x10] - vaddnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vaddbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vaddnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vaddbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x58,0xb4,0x80,0x23,0x01,0x00,0x00] - vaddnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vaddbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vaddnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vaddbf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x58,0x35,0x00,0x00,0x00,0x00] - vaddnepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vaddbf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vaddnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vaddbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x58,0x34,0x6d,0x00,0xfe,0xff,0xff] - vaddnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vaddbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vaddnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vaddbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x58,0x71,0x7f] - vaddnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vaddbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vaddnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vaddbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x58,0x72,0x80] - vaddnepbf16 xmm22 {k7} {z}, 
xmm23, word ptr [rdx - 256]{1to8} + vaddbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vcmppbf16 k5, ymm23, ymm24, 123 +// CHECK: vcmpbf16 k5, ymm23, ymm24, 123 // CHECK: encoding: [0x62,0x93,0x47,0x20,0xc2,0xe8,0x7b] - vcmppbf16 k5, ymm23, ymm24, 123 + vcmpbf16 k5, ymm23, ymm24, 123 -// CHECK: vcmppbf16 k5 {k7}, ymm23, ymm24, 123 +// CHECK: vcmpbf16 k5 {k7}, ymm23, ymm24, 123 // CHECK: encoding: [0x62,0x93,0x47,0x27,0xc2,0xe8,0x7b] - vcmppbf16 k5 {k7}, ymm23, ymm24, 123 + vcmpbf16 k5 {k7}, ymm23, ymm24, 123 -// CHECK: vcmppbf16 k5, xmm23, xmm24, 123 +// CHECK: vcmpbf16 k5, xmm23, xmm24, 123 // CHECK: encoding: [0x62,0x93,0x47,0x00,0xc2,0xe8,0x7b] - vcmppbf16 k5, xmm23, xmm24, 123 + vcmpbf16 k5, xmm23, xmm24, 123 -// CHECK: vcmppbf16 k5 {k7}, xmm23, xmm24, 123 +// CHECK: vcmpbf16 k5 {k7}, xmm23, xmm24, 123 // CHECK: encoding: [0x62,0x93,0x47,0x07,0xc2,0xe8,0x7b] - vcmppbf16 k5 {k7}, xmm23, xmm24, 123 + vcmpbf16 k5 {k7}, xmm23, xmm24, 123 -// CHECK: vcmppbf16 k5, zmm23, zmm24, 123 +// CHECK: vcmpbf16 k5, zmm23, zmm24, 123 // CHECK: encoding: [0x62,0x93,0x47,0x40,0xc2,0xe8,0x7b] - vcmppbf16 k5, zmm23, zmm24, 123 + vcmpbf16 k5, zmm23, zmm24, 123 -// CHECK: vcmppbf16 k5 {k7}, zmm23, zmm24, 123 +// CHECK: vcmpbf16 k5 {k7}, zmm23, zmm24, 123 // CHECK: encoding: [0x62,0x93,0x47,0x47,0xc2,0xe8,0x7b] - vcmppbf16 k5 {k7}, zmm23, zmm24, 123 + vcmpbf16 k5 {k7}, zmm23, zmm24, 123 -// CHECK: vcmppbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vcmpbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xb3,0x47,0x40,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123 + vcmpbf16 k5, zmm23, zmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xd3,0x47,0x47,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - 
vcmppbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123 + vcmpbf16 k5 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vcmppbf16 k5, zmm23, word ptr [rip]{1to32}, 123 +// CHECK: vcmpbf16 k5, zmm23, word ptr [rip]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x47,0x50,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b] - vcmppbf16 k5, zmm23, word ptr [rip]{1to32}, 123 + vcmpbf16 k5, zmm23, word ptr [rip]{1to32}, 123 -// CHECK: vcmppbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123 +// CHECK: vcmpbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123 // CHECK: encoding: [0x62,0xf3,0x47,0x40,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vcmppbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123 + vcmpbf16 k5, zmm23, zmmword ptr [2*rbp - 2048], 123 -// CHECK: vcmppbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123 +// CHECK: vcmpbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123 // CHECK: encoding: [0x62,0xf3,0x47,0x47,0xc2,0x69,0x7f,0x7b] - vcmppbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123 + vcmpbf16 k5 {k7}, zmm23, zmmword ptr [rcx + 8128], 123 -// CHECK: vcmppbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123 +// CHECK: vcmpbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x47,0x57,0xc2,0x6a,0x80,0x7b] - vcmppbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123 + vcmpbf16 k5 {k7}, zmm23, word ptr [rdx - 256]{1to32}, 123 -// CHECK: vcmppbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vcmpbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xb3,0x47,0x00,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123 + vcmpbf16 k5, xmm23, xmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xd3,0x47,0x07,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 k5 {k7}, xmm23, xmmword ptr 
[r8 + 4*rax + 291], 123 + vcmpbf16 k5 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vcmppbf16 k5, xmm23, word ptr [rip]{1to8}, 123 +// CHECK: vcmpbf16 k5, xmm23, word ptr [rip]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x47,0x10,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b] - vcmppbf16 k5, xmm23, word ptr [rip]{1to8}, 123 + vcmpbf16 k5, xmm23, word ptr [rip]{1to8}, 123 -// CHECK: vcmppbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123 +// CHECK: vcmpbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123 // CHECK: encoding: [0x62,0xf3,0x47,0x00,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vcmppbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123 + vcmpbf16 k5, xmm23, xmmword ptr [2*rbp - 512], 123 -// CHECK: vcmppbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123 +// CHECK: vcmpbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123 // CHECK: encoding: [0x62,0xf3,0x47,0x07,0xc2,0x69,0x7f,0x7b] - vcmppbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123 + vcmpbf16 k5 {k7}, xmm23, xmmword ptr [rcx + 2032], 123 -// CHECK: vcmppbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123 +// CHECK: vcmpbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x47,0x17,0xc2,0x6a,0x80,0x7b] - vcmppbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123 + vcmpbf16 k5 {k7}, xmm23, word ptr [rdx - 256]{1to8}, 123 -// CHECK: vcmppbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vcmpbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xb3,0x47,0x20,0xc2,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vcmppbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123 + vcmpbf16 k5, ymm23, ymmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xd3,0x47,0x27,0xc2,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - vcmppbf16 k5 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291], 123 + vcmpbf16 k5 {k7}, ymm23, 
ymmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vcmppbf16 k5, ymm23, word ptr [rip]{1to16}, 123 +// CHECK: vcmpbf16 k5, ymm23, word ptr [rip]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x47,0x30,0xc2,0x2d,0x00,0x00,0x00,0x00,0x7b] - vcmppbf16 k5, ymm23, word ptr [rip]{1to16}, 123 + vcmpbf16 k5, ymm23, word ptr [rip]{1to16}, 123 -// CHECK: vcmppbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123 +// CHECK: vcmpbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123 // CHECK: encoding: [0x62,0xf3,0x47,0x20,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vcmppbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123 + vcmpbf16 k5, ymm23, ymmword ptr [2*rbp - 1024], 123 -// CHECK: vcmppbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123 +// CHECK: vcmpbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123 // CHECK: encoding: [0x62,0xf3,0x47,0x27,0xc2,0x69,0x7f,0x7b] - vcmppbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123 + vcmpbf16 k5 {k7}, ymm23, ymmword ptr [rcx + 4064], 123 -// CHECK: vcmppbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123 +// CHECK: vcmpbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x47,0x37,0xc2,0x6a,0x80,0x7b] - vcmppbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123 + vcmpbf16 k5 {k7}, ymm23, word ptr [rdx - 256]{1to16}, 123 // CHECK: vcomsbf16 xmm22, xmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x2f,0xf7] @@ -232,2783 +232,2783 @@ // CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x2f,0x72,0x80] vcomsbf16 xmm22, word ptr [rdx - 256] -// CHECK: vdivnepbf16 ymm22, ymm23, ymm24 +// CHECK: vdivbf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5e,0xf0] - vdivnepbf16 ymm22, ymm23, ymm24 + vdivbf16 ymm22, ymm23, ymm24 -// CHECK: vdivnepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vdivbf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5e,0xf0] - vdivnepbf16 ymm22 {k7}, ymm23, ymm24 + vdivbf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vdivbf16 ymm22 {k7} {z}, ymm23, 
ymm24 // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5e,0xf0] - vdivnepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vdivbf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vdivnepbf16 zmm22, zmm23, zmm24 +// CHECK: vdivbf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5e,0xf0] - vdivnepbf16 zmm22, zmm23, zmm24 + vdivbf16 zmm22, zmm23, zmm24 -// CHECK: vdivnepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vdivbf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5e,0xf0] - vdivnepbf16 zmm22 {k7}, zmm23, zmm24 + vdivbf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vdivbf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5e,0xf0] - vdivnepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vdivbf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vdivnepbf16 xmm22, xmm23, xmm24 +// CHECK: vdivbf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5e,0xf0] - vdivnepbf16 xmm22, xmm23, xmm24 + vdivbf16 xmm22, xmm23, xmm24 -// CHECK: vdivnepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vdivbf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5e,0xf0] - vdivnepbf16 xmm22 {k7}, xmm23, xmm24 + vdivbf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vdivbf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5e,0xf0] - vdivnepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vdivbf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vdivnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vdivbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vdivnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vdivbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vdivnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vdivbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: 
[0x62,0xc5,0x45,0x47,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00] - vdivnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vdivbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vdivnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vdivbf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5e,0x35,0x00,0x00,0x00,0x00] - vdivnepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vdivbf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vdivnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vdivbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5e,0x34,0x6d,0x00,0xf8,0xff,0xff] - vdivnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vdivbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vdivnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vdivbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5e,0x71,0x7f] - vdivnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vdivbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vdivnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vdivbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5e,0x72,0x80] - vdivnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vdivbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vdivnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vdivbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vdivnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vdivbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vdivnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vdivbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00] - 
vdivnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vdivbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vdivnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vdivbf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5e,0x35,0x00,0x00,0x00,0x00] - vdivnepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vdivbf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vdivnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vdivbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5e,0x34,0x6d,0x00,0xfc,0xff,0xff] - vdivnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vdivbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vdivnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vdivbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5e,0x71,0x7f] - vdivnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vdivbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vdivnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vdivbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5e,0x72,0x80] - vdivnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vdivbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vdivnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vdivbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vdivnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vdivbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vdivnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vdivbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5e,0xb4,0x80,0x23,0x01,0x00,0x00] - vdivnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 
+ vdivbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vdivnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vdivbf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5e,0x35,0x00,0x00,0x00,0x00] - vdivnepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vdivbf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vdivnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vdivbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5e,0x34,0x6d,0x00,0xfe,0xff,0xff] - vdivnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vdivbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vdivnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vdivbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5e,0x71,0x7f] - vdivnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vdivbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vdivnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vdivbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5e,0x72,0x80] - vdivnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vdivbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfmadd132nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfmadd132bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x98,0xf0] - vfmadd132nepbf16 ymm22, ymm23, ymm24 + vfmadd132bf16 ymm22, ymm23, ymm24 -// CHECK: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfmadd132bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0x98,0xf0] - vfmadd132nepbf16 ymm22 {k7}, ymm23, ymm24 + vfmadd132bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x98,0xf0] - vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfmadd132bf16 ymm22 {k7} {z}, ymm23, 
ymm24 -// CHECK: vfmadd132nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfmadd132bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x98,0xf0] - vfmadd132nepbf16 zmm22, zmm23, zmm24 + vfmadd132bf16 zmm22, zmm23, zmm24 -// CHECK: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfmadd132bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0x98,0xf0] - vfmadd132nepbf16 zmm22 {k7}, zmm23, zmm24 + vfmadd132bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x98,0xf0] - vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfmadd132nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfmadd132bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x98,0xf0] - vfmadd132nepbf16 xmm22, xmm23, xmm24 + vfmadd132bf16 xmm22, xmm23, xmm24 -// CHECK: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfmadd132bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0x98,0xf0] - vfmadd132nepbf16 xmm22 {k7}, xmm23, xmm24 + vfmadd132bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0x98,0xf0] - vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: 
[0x62,0xc6,0x44,0x47,0x98,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x98,0x35,0x00,0x00,0x00,0x00] - vfmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x98,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x98,0x71,0x7f] - vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x98,0x72,0x80] - vfmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd132bf16 ymm22 {k7}, 
ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x98,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x98,0x35,0x00,0x00,0x00,0x00] - vfmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x98,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x98,0x71,0x7f] - vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x98,0x72,0x80] - vfmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x98,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd132nepbf16 xmm22 {k7}, xmm23, xmmword 
ptr [r8 + 4*rax + 291] +// CHECK: vfmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x98,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x98,0x35,0x00,0x00,0x00,0x00] - vfmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x98,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x98,0x71,0x7f] - vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x98,0x72,0x80] - vfmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfmadd213nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfmadd213bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xa8,0xf0] - vfmadd213nepbf16 ymm22, ymm23, ymm24 + vfmadd213bf16 ymm22, ymm23, ymm24 -// CHECK: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfmadd213bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xa8,0xf0] - 
vfmadd213nepbf16 ymm22 {k7}, ymm23, ymm24 + vfmadd213bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xa8,0xf0] - vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfmadd213nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfmadd213bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xa8,0xf0] - vfmadd213nepbf16 zmm22, zmm23, zmm24 + vfmadd213bf16 zmm22, zmm23, zmm24 -// CHECK: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfmadd213bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xa8,0xf0] - vfmadd213nepbf16 zmm22 {k7}, zmm23, zmm24 + vfmadd213bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xa8,0xf0] - vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfmadd213nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfmadd213bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xa8,0xf0] - vfmadd213nepbf16 xmm22, xmm23, xmm24 + vfmadd213bf16 xmm22, xmm23, xmm24 -// CHECK: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfmadd213bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0xa8,0xf0] - vfmadd213nepbf16 xmm22 {k7}, xmm23, xmm24 + vfmadd213bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0xa8,0xf0] - vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: 
[0x62,0xa6,0x44,0x40,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xa8,0x35,0x00,0x00,0x00,0x00] - vfmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xa8,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xa8,0x71,0x7f] - vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xa8,0x72,0x80] - vfmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd213bf16 ymm22, ymm23, 
ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xa8,0x35,0x00,0x00,0x00,0x00] - vfmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xa8,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xa8,0x71,0x7f] - vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xa8,0x72,0x80] - vfmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 
8*r14 + 268435456] +// CHECK: vfmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xa8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xa8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xa8,0x35,0x00,0x00,0x00,0x00] - vfmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xa8,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xa8,0x71,0x7f] - vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xa8,0x72,0x80] - vfmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: 
vfmadd231nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfmadd231bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xb8,0xf0] - vfmadd231nepbf16 ymm22, ymm23, ymm24 + vfmadd231bf16 ymm22, ymm23, ymm24 -// CHECK: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfmadd231bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xb8,0xf0] - vfmadd231nepbf16 ymm22 {k7}, ymm23, ymm24 + vfmadd231bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xb8,0xf0] - vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfmadd231nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfmadd231bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xb8,0xf0] - vfmadd231nepbf16 zmm22, zmm23, zmm24 + vfmadd231bf16 zmm22, zmm23, zmm24 -// CHECK: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfmadd231bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xb8,0xf0] - vfmadd231nepbf16 zmm22 {k7}, zmm23, zmm24 + vfmadd231bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xb8,0xf0] - vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfmadd231nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfmadd231bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xb8,0xf0] - vfmadd231nepbf16 xmm22, xmm23, xmm24 + vfmadd231bf16 xmm22, xmm23, xmm24 -// CHECK: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfmadd231bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0xb8,0xf0] - vfmadd231nepbf16 xmm22 {k7}, xmm23, xmm24 + vfmadd231bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24 // 
CHECK: encoding: [0x62,0x86,0x44,0x87,0xb8,0xf0] - vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xb8,0x35,0x00,0x00,0x00,0x00] - vfmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xb8,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xb8,0x71,0x7f] - vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 
256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xb8,0x72,0x80] - vfmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xb8,0x35,0x00,0x00,0x00,0x00] - vfmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xb8,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xb8,0x71,0x7f] - vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// 
CHECK: vfmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xb8,0x72,0x80] - vfmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xb8,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xb8,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xb8,0x35,0x00,0x00,0x00,0x00] - vfmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xb8,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xb8,0x71,0x7f] - vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfmadd231nepbf16 xmm22 
{k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xb8,0x72,0x80] - vfmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfmsub132nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfmsub132bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x9a,0xf0] - vfmsub132nepbf16 ymm22, ymm23, ymm24 + vfmsub132bf16 ymm22, ymm23, ymm24 -// CHECK: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfmsub132bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0x9a,0xf0] - vfmsub132nepbf16 ymm22 {k7}, ymm23, ymm24 + vfmsub132bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9a,0xf0] - vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfmsub132nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfmsub132bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x9a,0xf0] - vfmsub132nepbf16 zmm22, zmm23, zmm24 + vfmsub132bf16 zmm22, zmm23, zmm24 -// CHECK: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfmsub132bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0x9a,0xf0] - vfmsub132nepbf16 zmm22 {k7}, zmm23, zmm24 + vfmsub132bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9a,0xf0] - vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfmsub132nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfmsub132bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x9a,0xf0] - vfmsub132nepbf16 xmm22, xmm23, xmm24 + vfmsub132bf16 xmm22, xmm23, xmm24 -// CHECK: vfmsub132nepbf16 xmm22 
{k7}, xmm23, xmm24 +// CHECK: vfmsub132bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0x9a,0xf0] - vfmsub132nepbf16 xmm22 {k7}, xmm23, xmm24 + vfmsub132bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0x9a,0xf0] - vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9a,0x35,0x00,0x00,0x00,0x00] - vfmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9a,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: 
encoding: [0x62,0xe6,0x44,0xc7,0x9a,0x71,0x7f] - vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9a,0x72,0x80] - vfmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9a,0x35,0x00,0x00,0x00,0x00] - vfmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9a,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfmsub132bf16 
ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9a,0x71,0x7f] - vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9a,0x72,0x80] - vfmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9a,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9a,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9a,0x35,0x00,0x00,0x00,0x00] - vfmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9a,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, 
xmmword ptr [rcx + 2032] +// CHECK: vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9a,0x71,0x7f] - vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9a,0x72,0x80] - vfmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfmsub213nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfmsub213bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xaa,0xf0] - vfmsub213nepbf16 ymm22, ymm23, ymm24 + vfmsub213bf16 ymm22, ymm23, ymm24 -// CHECK: vfmsub213nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfmsub213bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xaa,0xf0] - vfmsub213nepbf16 ymm22 {k7}, ymm23, ymm24 + vfmsub213bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xaa,0xf0] - vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfmsub213nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfmsub213bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xaa,0xf0] - vfmsub213nepbf16 zmm22, zmm23, zmm24 + vfmsub213bf16 zmm22, zmm23, zmm24 -// CHECK: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfmsub213bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xaa,0xf0] - vfmsub213nepbf16 zmm22 {k7}, zmm23, zmm24 + vfmsub213bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xaa,0xf0] - vfmsub213nepbf16 zmm22 {k7} 
{z}, zmm23, zmm24 + vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfmsub213nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfmsub213bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xaa,0xf0] - vfmsub213nepbf16 xmm22, xmm23, xmm24 + vfmsub213bf16 xmm22, xmm23, xmm24 -// CHECK: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfmsub213bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0xaa,0xf0] - vfmsub213nepbf16 xmm22 {k7}, xmm23, xmm24 + vfmsub213bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0xaa,0xf0] - vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xaa,0x35,0x00,0x00,0x00,0x00] - vfmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: 
[0x62,0xe6,0x44,0x40,0xaa,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xaa,0x71,0x7f] - vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xaa,0x72,0x80] - vfmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xaa,0x35,0x00,0x00,0x00,0x00] - vfmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfmsub213bf16 
ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xaa,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xaa,0x71,0x7f] - vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xaa,0x72,0x80] - vfmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xaa,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xaa,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xaa,0x35,0x00,0x00,0x00,0x00] - vfmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfmsub213nepbf16 xmm22, 
xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xaa,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xaa,0x71,0x7f] - vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xaa,0x72,0x80] - vfmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfmsub231nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfmsub231bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xba,0xf0] - vfmsub231nepbf16 ymm22, ymm23, ymm24 + vfmsub231bf16 ymm22, ymm23, ymm24 -// CHECK: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfmsub231bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xba,0xf0] - vfmsub231nepbf16 ymm22 {k7}, ymm23, ymm24 + vfmsub231bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xba,0xf0] - vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfmsub231nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfmsub231bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xba,0xf0] - vfmsub231nepbf16 zmm22, zmm23, zmm24 + vfmsub231bf16 zmm22, zmm23, zmm24 -// CHECK: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfmsub231bf16 zmm22 {k7}, 
zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xba,0xf0] - vfmsub231nepbf16 zmm22 {k7}, zmm23, zmm24 + vfmsub231bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xba,0xf0] - vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfmsub231nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfmsub231bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xba,0xf0] - vfmsub231nepbf16 xmm22, xmm23, xmm24 + vfmsub231bf16 xmm22, xmm23, xmm24 -// CHECK: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfmsub231bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0xba,0xf0] - vfmsub231nepbf16 xmm22 {k7}, xmm23, xmm24 + vfmsub231bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0xba,0xf0] - vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xba,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: 
encoding: [0x62,0xe6,0x44,0x50,0xba,0x35,0x00,0x00,0x00,0x00] - vfmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xba,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xba,0x71,0x7f] - vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xba,0x72,0x80] - vfmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xba,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: 
vfmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xba,0x35,0x00,0x00,0x00,0x00] - vfmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xba,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xba,0x71,0x7f] - vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xba,0x72,0x80] - vfmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xba,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xba,0xb4,0x80,0x23,0x01,0x00,0x00] - vfmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: 
vfmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xba,0x35,0x00,0x00,0x00,0x00] - vfmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xba,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xba,0x71,0x7f] - vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xba,0x72,0x80] - vfmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfnmadd132nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfnmadd132bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x9c,0xf0] - vfnmadd132nepbf16 ymm22, ymm23, ymm24 + vfnmadd132bf16 ymm22, ymm23, ymm24 -// CHECK: vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfnmadd132bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0x9c,0xf0] - vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymm24 + vfnmadd132bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9c,0xf0] - vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfnmadd132bf16 
ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfnmadd132nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfnmadd132bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x9c,0xf0] - vfnmadd132nepbf16 zmm22, zmm23, zmm24 + vfnmadd132bf16 zmm22, zmm23, zmm24 -// CHECK: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfnmadd132bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0x9c,0xf0] - vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmm24 + vfnmadd132bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9c,0xf0] - vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfnmadd132nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfnmadd132bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x9c,0xf0] - vfnmadd132nepbf16 xmm22, xmm23, xmm24 + vfnmadd132bf16 xmm22, xmm23, xmm24 -// CHECK: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfnmadd132bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0x9c,0xf0] - vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmm24 + vfnmadd132bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0x9c,0xf0] - vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfnmadd132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr 
[r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfnmadd132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfnmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9c,0x35,0x00,0x00,0x00,0x00] - vfnmadd132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfnmadd132bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfnmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x9c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfnmadd132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9c,0x71,0x7f] - vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfnmadd132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfnmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9c,0x72,0x80] - vfnmadd132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfnmadd132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfnmadd132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd132nepbf16 ymm22 {k7}, ymm23, 
ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfnmadd132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfnmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9c,0x35,0x00,0x00,0x00,0x00] - vfnmadd132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfnmadd132bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfnmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfnmadd132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9c,0x71,0x7f] - vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfnmadd132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfnmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9c,0x72,0x80] - vfnmadd132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfnmadd132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfnmadd132bf16 xmm22, xmm23, 
xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9c,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfnmadd132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfnmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9c,0x35,0x00,0x00,0x00,0x00] - vfnmadd132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfnmadd132bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfnmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfnmadd132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9c,0x71,0x7f] - vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfnmadd132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfnmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9c,0x72,0x80] - vfnmadd132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfnmadd132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfnmadd213nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfnmadd213bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xac,0xf0] - vfnmadd213nepbf16 ymm22, ymm23, ymm24 + vfnmadd213bf16 ymm22, ymm23, ymm24 -// CHECK: vfnmadd213nepbf16 ymm22 {k7}, 
ymm23, ymm24 +// CHECK: vfnmadd213bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xac,0xf0] - vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymm24 + vfnmadd213bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xac,0xf0] - vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfnmadd213nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfnmadd213bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xac,0xf0] - vfnmadd213nepbf16 zmm22, zmm23, zmm24 + vfnmadd213bf16 zmm22, zmm23, zmm24 -// CHECK: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfnmadd213bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xac,0xf0] - vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmm24 + vfnmadd213bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xac,0xf0] - vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfnmadd213nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfnmadd213bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xac,0xf0] - vfnmadd213nepbf16 xmm22, xmm23, xmm24 + vfnmadd213bf16 xmm22, xmm23, xmm24 -// CHECK: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfnmadd213bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0xac,0xf0] - vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmm24 + vfnmadd213bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0xac,0xf0] - vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] 
+// CHECK: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfnmadd213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xac,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfnmadd213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfnmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xac,0x35,0x00,0x00,0x00,0x00] - vfnmadd213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfnmadd213bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfnmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xac,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfnmadd213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xac,0x71,0x7f] - vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfnmadd213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfnmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xac,0x72,0x80] - vfnmadd213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfnmadd213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} 
-// CHECK: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfnmadd213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xac,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfnmadd213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfnmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xac,0x35,0x00,0x00,0x00,0x00] - vfnmadd213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfnmadd213bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfnmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xac,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfnmadd213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xac,0x71,0x7f] - vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfnmadd213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfnmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xac,0x72,0x80] - vfnmadd213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx 
- 256]{1to16} + vfnmadd213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xac,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfnmadd213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xac,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfnmadd213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfnmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xac,0x35,0x00,0x00,0x00,0x00] - vfnmadd213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfnmadd213bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfnmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xac,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfnmadd213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xac,0x71,0x7f] - vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfnmadd213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfnmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: 
[0x62,0xe6,0x44,0x97,0xac,0x72,0x80] - vfnmadd213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfnmadd213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfnmadd231nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfnmadd231bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xbc,0xf0] - vfnmadd231nepbf16 ymm22, ymm23, ymm24 + vfnmadd231bf16 ymm22, ymm23, ymm24 -// CHECK: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfnmadd231bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xbc,0xf0] - vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymm24 + vfnmadd231bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbc,0xf0] - vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfnmadd231nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfnmadd231bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xbc,0xf0] - vfnmadd231nepbf16 zmm22, zmm23, zmm24 + vfnmadd231bf16 zmm22, zmm23, zmm24 -// CHECK: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfnmadd231bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xbc,0xf0] - vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmm24 + vfnmadd231bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbc,0xf0] - vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfnmadd231nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfnmadd231bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xbc,0xf0] - vfnmadd231nepbf16 xmm22, xmm23, xmm24 + vfnmadd231bf16 xmm22, xmm23, xmm24 -// CHECK: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfnmadd231bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: 
[0x62,0x86,0x44,0x07,0xbc,0xf0] - vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmm24 + vfnmadd231bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0xbc,0xf0] - vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfnmadd231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfnmadd231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfnmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xbc,0x35,0x00,0x00,0x00,0x00] - vfnmadd231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfnmadd231bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfnmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbc,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmadd231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfnmadd231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbc,0x71,0x7f] - vfnmadd231nepbf16 zmm22 
{k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfnmadd231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfnmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbc,0x72,0x80] - vfnmadd231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfnmadd231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfnmadd231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfnmadd231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfnmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbc,0x35,0x00,0x00,0x00,0x00] - vfnmadd231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfnmadd231bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfnmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbc,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmadd231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfnmadd231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] 
// CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbc,0x71,0x7f] - vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfnmadd231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfnmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbc,0x72,0x80] - vfnmadd231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfnmadd231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbc,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfnmadd231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbc,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmadd231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfnmadd231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfnmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbc,0x35,0x00,0x00,0x00,0x00] - vfnmadd231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfnmadd231bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfnmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xbc,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmadd231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfnmadd231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] 
+// CHECK: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbc,0x71,0x7f] - vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfnmadd231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfnmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbc,0x72,0x80] - vfnmadd231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfnmadd231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfnmsub132nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfnmsub132bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x9e,0xf0] - vfnmsub132nepbf16 ymm22, ymm23, ymm24 + vfnmsub132bf16 ymm22, ymm23, ymm24 -// CHECK: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfnmsub132bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0x9e,0xf0] - vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymm24 + vfnmsub132bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x9e,0xf0] - vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfnmsub132nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfnmsub132bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x9e,0xf0] - vfnmsub132nepbf16 zmm22, zmm23, zmm24 + vfnmsub132bf16 zmm22, zmm23, zmm24 -// CHECK: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfnmsub132bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0x9e,0xf0] - vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmm24 + vfnmsub132bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x9e,0xf0] - vfnmsub132nepbf16 zmm22 
{k7} {z}, zmm23, zmm24 + vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfnmsub132nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfnmsub132bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x9e,0xf0] - vfnmsub132nepbf16 xmm22, xmm23, xmm24 + vfnmsub132bf16 xmm22, xmm23, xmm24 -// CHECK: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfnmsub132bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0x9e,0xf0] - vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmm24 + vfnmsub132bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0x9e,0xf0] - vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfnmsub132bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfnmsub132bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfnmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x9e,0x35,0x00,0x00,0x00,0x00] - vfnmsub132nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfnmsub132bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfnmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: 
encoding: [0x62,0xe6,0x44,0x40,0x9e,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub132nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfnmsub132bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x9e,0x71,0x7f] - vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfnmsub132bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfnmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x9e,0x72,0x80] - vfnmsub132nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfnmsub132bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfnmsub132bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfnmsub132bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfnmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x9e,0x35,0x00,0x00,0x00,0x00] - vfnmsub132nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfnmsub132bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 
1024] +// CHECK: vfnmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x9e,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub132nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfnmsub132bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x9e,0x71,0x7f] - vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfnmsub132bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfnmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x9e,0x72,0x80] - vfnmsub132nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfnmsub132bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x9e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfnmsub132bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x9e,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub132nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfnmsub132bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfnmsub132bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x9e,0x35,0x00,0x00,0x00,0x00] - vfnmsub132nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfnmsub132bf16 xmm22, xmm23, word 
ptr [rip]{1to8} -// CHECK: vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfnmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x9e,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub132nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfnmsub132bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x9e,0x71,0x7f] - vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfnmsub132bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfnmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x9e,0x72,0x80] - vfnmsub132nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfnmsub132bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfnmsub213nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfnmsub213bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xae,0xf0] - vfnmsub213nepbf16 ymm22, ymm23, ymm24 + vfnmsub213bf16 ymm22, ymm23, ymm24 -// CHECK: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfnmsub213bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xae,0xf0] - vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymm24 + vfnmsub213bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xae,0xf0] - vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfnmsub213nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfnmsub213bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xae,0xf0] - vfnmsub213nepbf16 zmm22, zmm23, zmm24 + vfnmsub213bf16 zmm22, zmm23, zmm24 -// CHECK: 
vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfnmsub213bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xae,0xf0] - vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmm24 + vfnmsub213bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xae,0xf0] - vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfnmsub213nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfnmsub213bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xae,0xf0] - vfnmsub213nepbf16 xmm22, xmm23, xmm24 + vfnmsub213bf16 xmm22, xmm23, xmm24 -// CHECK: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfnmsub213bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0xae,0xf0] - vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmm24 + vfnmsub213bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0xae,0xf0] - vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vfnmsub213bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xae,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfnmsub213bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub213nepbf16 
zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfnmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xae,0x35,0x00,0x00,0x00,0x00] - vfnmsub213nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfnmsub213bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfnmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xae,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub213nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfnmsub213bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xae,0x71,0x7f] - vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfnmsub213bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfnmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xae,0x72,0x80] - vfnmsub213nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfnmsub213bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfnmsub213bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xae,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + 
vfnmsub213bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfnmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xae,0x35,0x00,0x00,0x00,0x00] - vfnmsub213nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfnmsub213bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfnmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xae,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub213nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfnmsub213bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xae,0x71,0x7f] - vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfnmsub213bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfnmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xae,0x72,0x80] - vfnmsub213nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfnmsub213bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xae,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfnmsub213bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: 
[0x62,0xc6,0x44,0x07,0xae,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub213nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfnmsub213bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfnmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xae,0x35,0x00,0x00,0x00,0x00] - vfnmsub213nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfnmsub213bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfnmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xae,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub213nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfnmsub213bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xae,0x71,0x7f] - vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfnmsub213bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfnmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xae,0x72,0x80] - vfnmsub213nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfnmsub213bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vfnmsub231nepbf16 ymm22, ymm23, ymm24 +// CHECK: vfnmsub231bf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0xbe,0xf0] - vfnmsub231nepbf16 ymm22, ymm23, ymm24 + vfnmsub231bf16 ymm22, ymm23, ymm24 -// CHECK: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vfnmsub231bf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0xbe,0xf0] - vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymm24 + vfnmsub231bf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: 
vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0xbe,0xf0] - vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vfnmsub231nepbf16 zmm22, zmm23, zmm24 +// CHECK: vfnmsub231bf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0xbe,0xf0] - vfnmsub231nepbf16 zmm22, zmm23, zmm24 + vfnmsub231bf16 zmm22, zmm23, zmm24 -// CHECK: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vfnmsub231bf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0xbe,0xf0] - vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmm24 + vfnmsub231bf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0xbe,0xf0] - vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vfnmsub231nepbf16 xmm22, xmm23, xmm24 +// CHECK: vfnmsub231bf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0xbe,0xf0] - vfnmsub231nepbf16 xmm22, xmm23, xmm24 + vfnmsub231bf16 xmm22, xmm23, xmm24 -// CHECK: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vfnmsub231bf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x07,0xbe,0xf0] - vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmm24 + vfnmsub231bf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0xbe,0xf0] - vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 
+ 268435456] + vfnmsub231bf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vfnmsub231bf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vfnmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0xbe,0x35,0x00,0x00,0x00,0x00] - vfnmsub231nepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vfnmsub231bf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vfnmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0xbe,0x34,0x6d,0x00,0xf8,0xff,0xff] - vfnmsub231nepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vfnmsub231bf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0xbe,0x71,0x7f] - vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vfnmsub231bf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vfnmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0xbe,0x72,0x80] - vfnmsub231nepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vfnmsub231bf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: 
[0x62,0xa6,0x44,0x20,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vfnmsub231bf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vfnmsub231bf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vfnmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0xbe,0x35,0x00,0x00,0x00,0x00] - vfnmsub231nepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vfnmsub231bf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vfnmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0xbe,0x34,0x6d,0x00,0xfc,0xff,0xff] - vfnmsub231nepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vfnmsub231bf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0xbe,0x71,0x7f] - vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vfnmsub231bf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vfnmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0xbe,0x72,0x80] - vfnmsub231nepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vfnmsub231bf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: 
vfnmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0xbe,0xb4,0xf5,0x00,0x00,0x00,0x10] - vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vfnmsub231bf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vfnmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0xbe,0xb4,0x80,0x23,0x01,0x00,0x00] - vfnmsub231nepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vfnmsub231bf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vfnmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vfnmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0xbe,0x35,0x00,0x00,0x00,0x00] - vfnmsub231nepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vfnmsub231bf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vfnmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0xbe,0x34,0x6d,0x00,0xfe,0xff,0xff] - vfnmsub231nepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vfnmsub231bf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0xbe,0x71,0x7f] - vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vfnmsub231bf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vfnmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0xbe,0x72,0x80] - vfnmsub231nepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vfnmsub231bf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: 
vfpclasspbf16 k5, zmm23, 123 +// CHECK: vfpclassbf16 k5, zmm23, 123 // CHECK: encoding: [0x62,0xb3,0x7f,0x48,0x66,0xef,0x7b] - vfpclasspbf16 k5, zmm23, 123 + vfpclassbf16 k5, zmm23, 123 -// CHECK: vfpclasspbf16 k5 {k7}, zmm23, 123 +// CHECK: vfpclassbf16 k5 {k7}, zmm23, 123 // CHECK: encoding: [0x62,0xb3,0x7f,0x4f,0x66,0xef,0x7b] - vfpclasspbf16 k5 {k7}, zmm23, 123 + vfpclassbf16 k5 {k7}, zmm23, 123 -// CHECK: vfpclasspbf16 k5, ymm23, 123 +// CHECK: vfpclassbf16 k5, ymm23, 123 // CHECK: encoding: [0x62,0xb3,0x7f,0x28,0x66,0xef,0x7b] - vfpclasspbf16 k5, ymm23, 123 + vfpclassbf16 k5, ymm23, 123 -// CHECK: vfpclasspbf16 k5 {k7}, ymm23, 123 +// CHECK: vfpclassbf16 k5 {k7}, ymm23, 123 // CHECK: encoding: [0x62,0xb3,0x7f,0x2f,0x66,0xef,0x7b] - vfpclasspbf16 k5 {k7}, ymm23, 123 + vfpclassbf16 k5 {k7}, ymm23, 123 -// CHECK: vfpclasspbf16 k5, xmm23, 123 +// CHECK: vfpclassbf16 k5, xmm23, 123 // CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xef,0x7b] - vfpclasspbf16 k5, xmm23, 123 + vfpclassbf16 k5, xmm23, 123 -// CHECK: vfpclasspbf16 k5 {k7}, xmm23, 123 +// CHECK: vfpclassbf16 k5 {k7}, xmm23, 123 // CHECK: encoding: [0x62,0xb3,0x7f,0x0f,0x66,0xef,0x7b] - vfpclasspbf16 k5 {k7}, xmm23, 123 + vfpclassbf16 k5 {k7}, xmm23, 123 -// CHECK: vfpclasspbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vfpclassbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xb3,0x7f,0x08,0x66,0xac,0xf5,0x00,0x00,0x00,0x10,0x7b] - vfpclasspbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123 + vfpclassbf16 k5, xmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xd3,0x7f,0x0f,0x66,0xac,0x80,0x23,0x01,0x00,0x00,0x7b] - vfpclasspbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 + vfpclassbf16 k5 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vfpclasspbf16 k5, word ptr [rip]{1to8}, 123 +// CHECK: 
vfpclassbf16 k5, word ptr [rip]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x18,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b] - vfpclasspbf16 k5, word ptr [rip]{1to8}, 123 + vfpclassbf16 k5, word ptr [rip]{1to8}, 123 -// CHECK: vfpclasspbf16 k5, xmmword ptr [2*rbp - 512], 123 +// CHECK: vfpclassbf16 k5, xmmword ptr [2*rbp - 512], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vfpclasspbf16 k5, xmmword ptr [2*rbp - 512], 123 + vfpclassbf16 k5, xmmword ptr [2*rbp - 512], 123 -// CHECK: vfpclasspbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123 +// CHECK: vfpclassbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123 + vfpclassbf16 k5 {k7}, xmmword ptr [rcx + 2032], 123 -// CHECK: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123 +// CHECK: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123 + vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to8}, 123 -// CHECK: vfpclasspbf16 k5, word ptr [rip]{1to16}, 123 +// CHECK: vfpclassbf16 k5, word ptr [rip]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x38,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b] - vfpclasspbf16 k5, word ptr [rip]{1to16}, 123 + vfpclassbf16 k5, word ptr [rip]{1to16}, 123 -// CHECK: vfpclasspbf16 k5, ymmword ptr [2*rbp - 1024], 123 +// CHECK: vfpclassbf16 k5, ymmword ptr [2*rbp - 1024], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vfpclasspbf16 k5, ymmword ptr [2*rbp - 1024], 123 + vfpclassbf16 k5, ymmword ptr [2*rbp - 1024], 123 -// CHECK: vfpclasspbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123 +// CHECK: vfpclassbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16 k5 {k7}, ymmword ptr [rcx + 4064], 123 + vfpclassbf16 k5 {k7}, ymmword ptr [rcx + 4064], 
123 -// CHECK: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123 +// CHECK: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123 + vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to16}, 123 -// CHECK: vfpclasspbf16 k5, word ptr [rip]{1to32}, 123 +// CHECK: vfpclassbf16 k5, word ptr [rip]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x58,0x66,0x2d,0x00,0x00,0x00,0x00,0x7b] - vfpclasspbf16 k5, word ptr [rip]{1to32}, 123 + vfpclassbf16 k5, word ptr [rip]{1to32}, 123 -// CHECK: vfpclasspbf16 k5, zmmword ptr [2*rbp - 2048], 123 +// CHECK: vfpclassbf16 k5, zmmword ptr [2*rbp - 2048], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vfpclasspbf16 k5, zmmword ptr [2*rbp - 2048], 123 + vfpclassbf16 k5, zmmword ptr [2*rbp - 2048], 123 -// CHECK: vfpclasspbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123 +// CHECK: vfpclassbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b] - vfpclasspbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123 + vfpclassbf16 k5 {k7}, zmmword ptr [rcx + 8128], 123 -// CHECK: vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123 +// CHECK: vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b] - vfpclasspbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123 + vfpclassbf16 k5 {k7}, word ptr [rdx - 256]{1to32}, 123 -// CHECK: vgetexppbf16 xmm22, xmm23 +// CHECK: vgetexpbf16 xmm22, xmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xf7] - vgetexppbf16 xmm22, xmm23 + vgetexpbf16 xmm22, xmm23 -// CHECK: vgetexppbf16 xmm22 {k7}, xmm23 +// CHECK: vgetexpbf16 xmm22 {k7}, xmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x42,0xf7] - vgetexppbf16 xmm22 {k7}, xmm23 + vgetexpbf16 xmm22 {k7}, xmm23 -// CHECK: vgetexppbf16 xmm22 {k7} {z}, xmm23 +// CHECK: vgetexpbf16 xmm22 {k7} {z}, xmm23 // CHECK: encoding: 
[0x62,0xa5,0x7d,0x8f,0x42,0xf7] - vgetexppbf16 xmm22 {k7} {z}, xmm23 + vgetexpbf16 xmm22 {k7} {z}, xmm23 -// CHECK: vgetexppbf16 zmm22, zmm23 +// CHECK: vgetexpbf16 zmm22, zmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xf7] - vgetexppbf16 zmm22, zmm23 + vgetexpbf16 zmm22, zmm23 -// CHECK: vgetexppbf16 zmm22 {k7}, zmm23 +// CHECK: vgetexpbf16 zmm22 {k7}, zmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x42,0xf7] - vgetexppbf16 zmm22 {k7}, zmm23 + vgetexpbf16 zmm22 {k7}, zmm23 -// CHECK: vgetexppbf16 zmm22 {k7} {z}, zmm23 +// CHECK: vgetexpbf16 zmm22 {k7} {z}, zmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x42,0xf7] - vgetexppbf16 zmm22 {k7} {z}, zmm23 + vgetexpbf16 zmm22 {k7} {z}, zmm23 -// CHECK: vgetexppbf16 ymm22, ymm23 +// CHECK: vgetexpbf16 ymm22, ymm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xf7] - vgetexppbf16 ymm22, ymm23 + vgetexpbf16 ymm22, ymm23 -// CHECK: vgetexppbf16 ymm22 {k7}, ymm23 +// CHECK: vgetexpbf16 ymm22 {k7}, ymm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x42,0xf7] - vgetexppbf16 ymm22 {k7}, ymm23 + vgetexpbf16 ymm22 {k7}, ymm23 -// CHECK: vgetexppbf16 ymm22 {k7} {z}, ymm23 +// CHECK: vgetexpbf16 ymm22 {k7} {z}, ymm23 // CHECK: encoding: [0x62,0xa5,0x7d,0xaf,0x42,0xf7] - vgetexppbf16 ymm22 {k7} {z}, ymm23 + vgetexpbf16 ymm22 {k7} {z}, ymm23 -// CHECK: vgetexppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vgetexpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10] - vgetexppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] + vgetexpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vgetexppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vgetexpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00] - vgetexppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] + vgetexpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vgetexppbf16 xmm22, word ptr 
[rip]{1to8} +// CHECK: vgetexpbf16 xmm22, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x42,0x35,0x00,0x00,0x00,0x00] - vgetexppbf16 xmm22, word ptr [rip]{1to8} + vgetexpbf16 xmm22, word ptr [rip]{1to8} -// CHECK: vgetexppbf16 xmm22, xmmword ptr [2*rbp - 512] +// CHECK: vgetexpbf16 xmm22, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x42,0x34,0x6d,0x00,0xfe,0xff,0xff] - vgetexppbf16 xmm22, xmmword ptr [2*rbp - 512] + vgetexpbf16 xmm22, xmmword ptr [2*rbp - 512] -// CHECK: vgetexppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] +// CHECK: vgetexpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x42,0x71,0x7f] - vgetexppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] + vgetexpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] -// CHECK: vgetexppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +// CHECK: vgetexpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x42,0x72,0x80] - vgetexppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} + vgetexpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} -// CHECK: vgetexppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vgetexpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10] - vgetexppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] + vgetexpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vgetexppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vgetexpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00] - vgetexppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] + vgetexpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vgetexppbf16 ymm22, word ptr [rip]{1to16} +// CHECK: vgetexpbf16 ymm22, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x42,0x35,0x00,0x00,0x00,0x00] - vgetexppbf16 ymm22, word ptr [rip]{1to16} + vgetexpbf16 
ymm22, word ptr [rip]{1to16} -// CHECK: vgetexppbf16 ymm22, ymmword ptr [2*rbp - 1024] +// CHECK: vgetexpbf16 ymm22, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x42,0x34,0x6d,0x00,0xfc,0xff,0xff] - vgetexppbf16 ymm22, ymmword ptr [2*rbp - 1024] + vgetexpbf16 ymm22, ymmword ptr [2*rbp - 1024] -// CHECK: vgetexppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] +// CHECK: vgetexpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x42,0x71,0x7f] - vgetexppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] + vgetexpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] -// CHECK: vgetexppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +// CHECK: vgetexpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x42,0x72,0x80] - vgetexppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} + vgetexpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} -// CHECK: vgetexppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vgetexpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x42,0xb4,0xf5,0x00,0x00,0x00,0x10] - vgetexppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] + vgetexpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vgetexppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vgetexpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x42,0xb4,0x80,0x23,0x01,0x00,0x00] - vgetexppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] + vgetexpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vgetexppbf16 zmm22, word ptr [rip]{1to32} +// CHECK: vgetexpbf16 zmm22, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x42,0x35,0x00,0x00,0x00,0x00] - vgetexppbf16 zmm22, word ptr [rip]{1to32} + vgetexpbf16 zmm22, word ptr [rip]{1to32} -// CHECK: vgetexppbf16 zmm22, zmmword ptr [2*rbp - 2048] +// CHECK: vgetexpbf16 zmm22, zmmword ptr [2*rbp - 2048] // CHECK: encoding: 
[0x62,0xe5,0x7d,0x48,0x42,0x34,0x6d,0x00,0xf8,0xff,0xff] - vgetexppbf16 zmm22, zmmword ptr [2*rbp - 2048] + vgetexpbf16 zmm22, zmmword ptr [2*rbp - 2048] -// CHECK: vgetexppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +// CHECK: vgetexpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x42,0x71,0x7f] - vgetexppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] + vgetexpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] -// CHECK: vgetexppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} +// CHECK: vgetexpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x42,0x72,0x80] - vgetexppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} + vgetexpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} -// CHECK: vgetmantpbf16 zmm22, zmm23, 123 +// CHECK: vgetmantbf16 zmm22, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xf7,0x7b] - vgetmantpbf16 zmm22, zmm23, 123 + vgetmantbf16 zmm22, zmm23, 123 -// CHECK: vgetmantpbf16 zmm22 {k7}, zmm23, 123 +// CHECK: vgetmantbf16 zmm22 {k7}, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x26,0xf7,0x7b] - vgetmantpbf16 zmm22 {k7}, zmm23, 123 + vgetmantbf16 zmm22 {k7}, zmm23, 123 -// CHECK: vgetmantpbf16 zmm22 {k7} {z}, zmm23, 123 +// CHECK: vgetmantbf16 zmm22 {k7} {z}, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x26,0xf7,0x7b] - vgetmantpbf16 zmm22 {k7} {z}, zmm23, 123 + vgetmantbf16 zmm22 {k7} {z}, zmm23, 123 -// CHECK: vgetmantpbf16 ymm22, ymm23, 123 +// CHECK: vgetmantbf16 ymm22, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xf7,0x7b] - vgetmantpbf16 ymm22, ymm23, 123 + vgetmantbf16 ymm22, ymm23, 123 -// CHECK: vgetmantpbf16 ymm22 {k7}, ymm23, 123 +// CHECK: vgetmantbf16 ymm22 {k7}, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x26,0xf7,0x7b] - vgetmantpbf16 ymm22 {k7}, ymm23, 123 + vgetmantbf16 ymm22 {k7}, ymm23, 123 -// CHECK: vgetmantpbf16 ymm22 {k7} {z}, ymm23, 123 +// CHECK: vgetmantbf16 ymm22 {k7} {z}, ymm23, 123 // CHECK: 
encoding: [0x62,0xa3,0x7f,0xaf,0x26,0xf7,0x7b] - vgetmantpbf16 ymm22 {k7} {z}, ymm23, 123 + vgetmantbf16 ymm22 {k7} {z}, ymm23, 123 -// CHECK: vgetmantpbf16 xmm22, xmm23, 123 +// CHECK: vgetmantbf16 xmm22, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xf7,0x7b] - vgetmantpbf16 xmm22, xmm23, 123 + vgetmantbf16 xmm22, xmm23, 123 -// CHECK: vgetmantpbf16 xmm22 {k7}, xmm23, 123 +// CHECK: vgetmantbf16 xmm22 {k7}, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x26,0xf7,0x7b] - vgetmantpbf16 xmm22 {k7}, xmm23, 123 + vgetmantbf16 xmm22 {k7}, xmm23, 123 -// CHECK: vgetmantpbf16 xmm22 {k7} {z}, xmm23, 123 +// CHECK: vgetmantbf16 xmm22 {k7} {z}, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x26,0xf7,0x7b] - vgetmantpbf16 xmm22 {k7} {z}, xmm23, 123 + vgetmantbf16 xmm22 {k7} {z}, xmm23, 123 -// CHECK: vgetmantpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vgetmantbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 + vgetmantbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vgetmantpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vgetmantbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 + vgetmantbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vgetmantpbf16 xmm22, word ptr [rip]{1to8}, 123 +// CHECK: vgetmantbf16 xmm22, word ptr [rip]{1to8}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x26,0x35,0x00,0x00,0x00,0x00,0x7b] - vgetmantpbf16 xmm22, word ptr [rip]{1to8}, 123 + vgetmantbf16 xmm22, word ptr [rip]{1to8}, 123 -// CHECK: vgetmantpbf16 xmm22, xmmword ptr [2*rbp - 512], 123 +// CHECK: vgetmantbf16 xmm22, xmmword ptr [2*rbp - 512], 123 // CHECK: encoding: 
[0x62,0xe3,0x7f,0x08,0x26,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vgetmantpbf16 xmm22, xmmword ptr [2*rbp - 512], 123 + vgetmantbf16 xmm22, xmmword ptr [2*rbp - 512], 123 -// CHECK: vgetmantpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 +// CHECK: vgetmantbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x26,0x71,0x7f,0x7b] - vgetmantpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 + vgetmantbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 -// CHECK: vgetmantpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 +// CHECK: vgetmantbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x26,0x72,0x80,0x7b] - vgetmantpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 + vgetmantbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 -// CHECK: vgetmantpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vgetmantbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 + vgetmantbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vgetmantpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vgetmantbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 + vgetmantbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vgetmantpbf16 ymm22, word ptr [rip]{1to16}, 123 +// CHECK: vgetmantbf16 ymm22, word ptr [rip]{1to16}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x26,0x35,0x00,0x00,0x00,0x00,0x7b] - vgetmantpbf16 ymm22, word ptr [rip]{1to16}, 123 + vgetmantbf16 ymm22, word ptr [rip]{1to16}, 123 -// CHECK: vgetmantpbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 +// CHECK: vgetmantbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 // CHECK: encoding: 
[0x62,0xe3,0x7f,0x28,0x26,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vgetmantpbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 + vgetmantbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 -// CHECK: vgetmantpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 +// CHECK: vgetmantbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x26,0x71,0x7f,0x7b] - vgetmantpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 + vgetmantbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 -// CHECK: vgetmantpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 +// CHECK: vgetmantbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x26,0x72,0x80,0x7b] - vgetmantpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 + vgetmantbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 -// CHECK: vgetmantpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vgetmantbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x26,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vgetmantpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 + vgetmantbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vgetmantpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vgetmantbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x26,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vgetmantpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 + vgetmantbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vgetmantpbf16 zmm22, word ptr [rip]{1to32}, 123 +// CHECK: vgetmantbf16 zmm22, word ptr [rip]{1to32}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x26,0x35,0x00,0x00,0x00,0x00,0x7b] - vgetmantpbf16 zmm22, word ptr [rip]{1to32}, 123 + vgetmantbf16 zmm22, word ptr [rip]{1to32}, 123 -// CHECK: vgetmantpbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 +// CHECK: vgetmantbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 // CHECK: encoding: 
[0x62,0xe3,0x7f,0x48,0x26,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vgetmantpbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 + vgetmantbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 -// CHECK: vgetmantpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 +// CHECK: vgetmantbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x26,0x71,0x7f,0x7b] - vgetmantpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 + vgetmantbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 -// CHECK: vgetmantpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 +// CHECK: vgetmantbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x26,0x72,0x80,0x7b] - vgetmantpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 + vgetmantbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 -// CHECK: vmaxpbf16 ymm22, ymm23, ymm24 +// CHECK: vmaxbf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5f,0xf0] - vmaxpbf16 ymm22, ymm23, ymm24 + vmaxbf16 ymm22, ymm23, ymm24 -// CHECK: vmaxpbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vmaxbf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5f,0xf0] - vmaxpbf16 ymm22 {k7}, ymm23, ymm24 + vmaxbf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vmaxpbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vmaxbf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5f,0xf0] - vmaxpbf16 ymm22 {k7} {z}, ymm23, ymm24 + vmaxbf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vmaxpbf16 zmm22, zmm23, zmm24 +// CHECK: vmaxbf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5f,0xf0] - vmaxpbf16 zmm22, zmm23, zmm24 + vmaxbf16 zmm22, zmm23, zmm24 -// CHECK: vmaxpbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vmaxbf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5f,0xf0] - vmaxpbf16 zmm22 {k7}, zmm23, zmm24 + vmaxbf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vmaxbf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: 
encoding: [0x62,0x85,0x45,0xc7,0x5f,0xf0] - vmaxpbf16 zmm22 {k7} {z}, zmm23, zmm24 + vmaxbf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vmaxpbf16 xmm22, xmm23, xmm24 +// CHECK: vmaxbf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5f,0xf0] - vmaxpbf16 xmm22, xmm23, xmm24 + vmaxbf16 xmm22, xmm23, xmm24 -// CHECK: vmaxpbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vmaxbf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5f,0xf0] - vmaxpbf16 xmm22 {k7}, xmm23, xmm24 + vmaxbf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vmaxbf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5f,0xf0] - vmaxpbf16 xmm22 {k7} {z}, xmm23, xmm24 + vmaxbf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vmaxpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vmaxbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmaxpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vmaxbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vmaxpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vmaxbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00] - vmaxpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vmaxbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vmaxpbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vmaxbf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5f,0x35,0x00,0x00,0x00,0x00] - vmaxpbf16 zmm22, zmm23, word ptr [rip]{1to32} + vmaxbf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vmaxpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vmaxbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5f,0x34,0x6d,0x00,0xf8,0xff,0xff] - vmaxpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + 
vmaxbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vmaxpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vmaxbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5f,0x71,0x7f] - vmaxpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vmaxbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vmaxpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vmaxbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5f,0x72,0x80] - vmaxpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vmaxbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vmaxpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vmaxbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmaxpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vmaxbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vmaxpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vmaxbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00] - vmaxpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vmaxbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vmaxpbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vmaxbf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5f,0x35,0x00,0x00,0x00,0x00] - vmaxpbf16 ymm22, ymm23, word ptr [rip]{1to16} + vmaxbf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vmaxpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vmaxbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5f,0x34,0x6d,0x00,0xfc,0xff,0xff] - vmaxpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vmaxbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vmaxpbf16 ymm22 {k7} {z}, 
ymm23, ymmword ptr [rcx + 4064] +// CHECK: vmaxbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5f,0x71,0x7f] - vmaxpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vmaxbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vmaxpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vmaxbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5f,0x72,0x80] - vmaxpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vmaxbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vmaxpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vmaxbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5f,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmaxpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vmaxbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vmaxpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vmaxbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5f,0xb4,0x80,0x23,0x01,0x00,0x00] - vmaxpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vmaxbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vmaxpbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vmaxbf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5f,0x35,0x00,0x00,0x00,0x00] - vmaxpbf16 xmm22, xmm23, word ptr [rip]{1to8} + vmaxbf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vmaxpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vmaxbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5f,0x34,0x6d,0x00,0xfe,0xff,0xff] - vmaxpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vmaxbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vmaxpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vmaxbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 
2032] // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5f,0x71,0x7f] - vmaxpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vmaxbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vmaxpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vmaxbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5f,0x72,0x80] - vmaxpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vmaxbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vminpbf16 ymm22, ymm23, ymm24 +// CHECK: vminbf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5d,0xf0] - vminpbf16 ymm22, ymm23, ymm24 + vminbf16 ymm22, ymm23, ymm24 -// CHECK: vminpbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vminbf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5d,0xf0] - vminpbf16 ymm22 {k7}, ymm23, ymm24 + vminbf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vminpbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vminbf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5d,0xf0] - vminpbf16 ymm22 {k7} {z}, ymm23, ymm24 + vminbf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vminpbf16 zmm22, zmm23, zmm24 +// CHECK: vminbf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5d,0xf0] - vminpbf16 zmm22, zmm23, zmm24 + vminbf16 zmm22, zmm23, zmm24 -// CHECK: vminpbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vminbf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5d,0xf0] - vminpbf16 zmm22 {k7}, zmm23, zmm24 + vminbf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vminpbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vminbf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5d,0xf0] - vminpbf16 zmm22 {k7} {z}, zmm23, zmm24 + vminbf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vminpbf16 xmm22, xmm23, xmm24 +// CHECK: vminbf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5d,0xf0] - vminpbf16 xmm22, xmm23, xmm24 + vminbf16 xmm22, xmm23, xmm24 -// CHECK: 
vminpbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vminbf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5d,0xf0] - vminpbf16 xmm22 {k7}, xmm23, xmm24 + vminbf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vminpbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vminbf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5d,0xf0] - vminpbf16 xmm22 {k7} {z}, xmm23, xmm24 + vminbf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vminpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vminbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10] - vminpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vminbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vminpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vminbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00] - vminpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vminbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vminpbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vminbf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5d,0x35,0x00,0x00,0x00,0x00] - vminpbf16 zmm22, zmm23, word ptr [rip]{1to32} + vminbf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vminpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vminbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5d,0x34,0x6d,0x00,0xf8,0xff,0xff] - vminpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vminbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vminpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vminbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5d,0x71,0x7f] - vminpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vminbf16 zmm22 {k7} {z}, zmm23, 
zmmword ptr [rcx + 8128] -// CHECK: vminpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vminbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5d,0x72,0x80] - vminpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vminbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vminpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vminbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10] - vminpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vminbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vminpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vminbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00] - vminpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vminbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vminpbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vminbf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5d,0x35,0x00,0x00,0x00,0x00] - vminpbf16 ymm22, ymm23, word ptr [rip]{1to16} + vminbf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vminpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vminbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5d,0x34,0x6d,0x00,0xfc,0xff,0xff] - vminpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vminbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vminpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vminbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5d,0x71,0x7f] - vminpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vminbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vminpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 
256]{1to16} +// CHECK: vminbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5d,0x72,0x80] - vminpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vminbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vminpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vminbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5d,0xb4,0xf5,0x00,0x00,0x00,0x10] - vminpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vminbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vminpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vminbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5d,0xb4,0x80,0x23,0x01,0x00,0x00] - vminpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vminbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vminpbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vminbf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5d,0x35,0x00,0x00,0x00,0x00] - vminpbf16 xmm22, xmm23, word ptr [rip]{1to8} + vminbf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vminpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vminbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5d,0x34,0x6d,0x00,0xfe,0xff,0xff] - vminpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vminbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vminpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vminbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5d,0x71,0x7f] - vminpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vminbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vminpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vminbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: 
encoding: [0x62,0xe5,0x45,0x97,0x5d,0x72,0x80] - vminpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vminbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vmulnepbf16 ymm22, ymm23, ymm24 +// CHECK: vmulbf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x59,0xf0] - vmulnepbf16 ymm22, ymm23, ymm24 + vmulbf16 ymm22, ymm23, ymm24 -// CHECK: vmulnepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vmulbf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x27,0x59,0xf0] - vmulnepbf16 ymm22 {k7}, ymm23, ymm24 + vmulbf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vmulbf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0xa7,0x59,0xf0] - vmulnepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vmulbf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vmulnepbf16 zmm22, zmm23, zmm24 +// CHECK: vmulbf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x59,0xf0] - vmulnepbf16 zmm22, zmm23, zmm24 + vmulbf16 zmm22, zmm23, zmm24 -// CHECK: vmulnepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vmulbf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x47,0x59,0xf0] - vmulnepbf16 zmm22 {k7}, zmm23, zmm24 + vmulbf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vmulbf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x59,0xf0] - vmulnepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vmulbf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vmulnepbf16 xmm22, xmm23, xmm24 +// CHECK: vmulbf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x59,0xf0] - vmulnepbf16 xmm22, xmm23, xmm24 + vmulbf16 xmm22, xmm23, xmm24 -// CHECK: vmulnepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vmulbf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x07,0x59,0xf0] - vmulnepbf16 xmm22 {k7}, xmm23, xmm24 + vmulbf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vmulbf16 xmm22 {k7} {z}, xmm23, 
xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x87,0x59,0xf0] - vmulnepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vmulbf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vmulnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vmulbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmulnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vmulbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vmulnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vmulbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x47,0x59,0xb4,0x80,0x23,0x01,0x00,0x00] - vmulnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vmulbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vmulnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vmulbf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x59,0x35,0x00,0x00,0x00,0x00] - vmulnepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vmulbf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vmulnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vmulbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x59,0x34,0x6d,0x00,0xf8,0xff,0xff] - vmulnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vmulbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vmulnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vmulbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x59,0x71,0x7f] - vmulnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vmulbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vmulnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vmulbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x59,0x72,0x80] - vmulnepbf16 zmm22 {k7} {z}, zmm23, word ptr 
[rdx - 256]{1to32} + vmulbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vmulnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vmulbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmulnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vmulbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vmulnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vmulbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x59,0xb4,0x80,0x23,0x01,0x00,0x00] - vmulnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vmulbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vmulnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vmulbf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x59,0x35,0x00,0x00,0x00,0x00] - vmulnepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vmulbf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vmulnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vmulbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x59,0x34,0x6d,0x00,0xfc,0xff,0xff] - vmulnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vmulbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vmulnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vmulbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x59,0x71,0x7f] - vmulnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vmulbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vmulnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vmulbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x59,0x72,0x80] - vmulnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vmulbf16 ymm22 {k7} {z}, ymm23, word ptr 
[rdx - 256]{1to16} -// CHECK: vmulnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vmulbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x59,0xb4,0xf5,0x00,0x00,0x00,0x10] - vmulnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vmulbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vmulnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vmulbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x59,0xb4,0x80,0x23,0x01,0x00,0x00] - vmulnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vmulbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vmulnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vmulbf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x59,0x35,0x00,0x00,0x00,0x00] - vmulnepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vmulbf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vmulnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vmulbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x59,0x34,0x6d,0x00,0xfe,0xff,0xff] - vmulnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vmulbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vmulnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vmulbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x59,0x71,0x7f] - vmulnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vmulbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vmulnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vmulbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x59,0x72,0x80] - vmulnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vmulbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vrcppbf16 xmm22, xmm23 +// CHECK: vrcpbf16 
xmm22, xmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xf7] - vrcppbf16 xmm22, xmm23 + vrcpbf16 xmm22, xmm23 -// CHECK: vrcppbf16 xmm22 {k7}, xmm23 +// CHECK: vrcpbf16 xmm22 {k7}, xmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4c,0xf7] - vrcppbf16 xmm22 {k7}, xmm23 + vrcpbf16 xmm22 {k7}, xmm23 -// CHECK: vrcppbf16 xmm22 {k7} {z}, xmm23 +// CHECK: vrcpbf16 xmm22 {k7} {z}, xmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4c,0xf7] - vrcppbf16 xmm22 {k7} {z}, xmm23 + vrcpbf16 xmm22 {k7} {z}, xmm23 -// CHECK: vrcppbf16 zmm22, zmm23 +// CHECK: vrcpbf16 zmm22, zmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xf7] - vrcppbf16 zmm22, zmm23 + vrcpbf16 zmm22, zmm23 -// CHECK: vrcppbf16 zmm22 {k7}, zmm23 +// CHECK: vrcpbf16 zmm22 {k7}, zmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4c,0xf7] - vrcppbf16 zmm22 {k7}, zmm23 + vrcpbf16 zmm22 {k7}, zmm23 -// CHECK: vrcppbf16 zmm22 {k7} {z}, zmm23 +// CHECK: vrcpbf16 zmm22 {k7} {z}, zmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4c,0xf7] - vrcppbf16 zmm22 {k7} {z}, zmm23 + vrcpbf16 zmm22 {k7} {z}, zmm23 -// CHECK: vrcppbf16 ymm22, ymm23 +// CHECK: vrcpbf16 ymm22, ymm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xf7] - vrcppbf16 ymm22, ymm23 + vrcpbf16 ymm22, ymm23 -// CHECK: vrcppbf16 ymm22 {k7}, ymm23 +// CHECK: vrcpbf16 ymm22 {k7}, ymm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4c,0xf7] - vrcppbf16 ymm22 {k7}, ymm23 + vrcpbf16 ymm22 {k7}, ymm23 -// CHECK: vrcppbf16 ymm22 {k7} {z}, ymm23 +// CHECK: vrcpbf16 ymm22 {k7} {z}, ymm23 // CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4c,0xf7] - vrcppbf16 ymm22 {k7} {z}, ymm23 + vrcpbf16 ymm22 {k7} {z}, ymm23 -// CHECK: vrcppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vrcpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrcppbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] + vrcpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vrcppbf16 xmm22 {k7}, xmmword ptr [r8 + 
4*rax + 291] +// CHECK: vrcpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00] - vrcppbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] + vrcpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vrcppbf16 xmm22, word ptr [rip]{1to8} +// CHECK: vrcpbf16 xmm22, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4c,0x35,0x00,0x00,0x00,0x00] - vrcppbf16 xmm22, word ptr [rip]{1to8} + vrcpbf16 xmm22, word ptr [rip]{1to8} -// CHECK: vrcppbf16 xmm22, xmmword ptr [2*rbp - 512] +// CHECK: vrcpbf16 xmm22, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x7c,0x08,0x4c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vrcppbf16 xmm22, xmmword ptr [2*rbp - 512] + vrcpbf16 xmm22, xmmword ptr [2*rbp - 512] -// CHECK: vrcppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] +// CHECK: vrcpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4c,0x71,0x7f] - vrcppbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] + vrcpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] -// CHECK: vrcppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +// CHECK: vrcpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4c,0x72,0x80] - vrcppbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} + vrcpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} -// CHECK: vrcppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vrcpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrcppbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] + vrcpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vrcppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vrcpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00] - vrcppbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] + vrcpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] -// 
CHECK: vrcppbf16 ymm22, word ptr [rip]{1to16} +// CHECK: vrcpbf16 ymm22, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4c,0x35,0x00,0x00,0x00,0x00] - vrcppbf16 ymm22, word ptr [rip]{1to16} + vrcpbf16 ymm22, word ptr [rip]{1to16} -// CHECK: vrcppbf16 ymm22, ymmword ptr [2*rbp - 1024] +// CHECK: vrcpbf16 ymm22, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vrcppbf16 ymm22, ymmword ptr [2*rbp - 1024] + vrcpbf16 ymm22, ymmword ptr [2*rbp - 1024] -// CHECK: vrcppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] +// CHECK: vrcpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4c,0x71,0x7f] - vrcppbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] + vrcpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] -// CHECK: vrcppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +// CHECK: vrcpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4c,0x72,0x80] - vrcppbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} + vrcpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} -// CHECK: vrcppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vrcpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrcppbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] + vrcpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vrcppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vrcpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4c,0xb4,0x80,0x23,0x01,0x00,0x00] - vrcppbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] + vrcpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vrcppbf16 zmm22, word ptr [rip]{1to32} +// CHECK: vrcpbf16 zmm22, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4c,0x35,0x00,0x00,0x00,0x00] - vrcppbf16 zmm22, word ptr [rip]{1to32} + vrcpbf16 zmm22, word ptr [rip]{1to32} -// 
CHECK: vrcppbf16 zmm22, zmmword ptr [2*rbp - 2048] +// CHECK: vrcpbf16 zmm22, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vrcppbf16 zmm22, zmmword ptr [2*rbp - 2048] + vrcpbf16 zmm22, zmmword ptr [2*rbp - 2048] -// CHECK: vrcppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +// CHECK: vrcpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4c,0x71,0x7f] - vrcppbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] + vrcpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] -// CHECK: vrcppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} +// CHECK: vrcpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4c,0x72,0x80] - vrcppbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} + vrcpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} -// CHECK: vreducenepbf16 zmm22, zmm23, 123 +// CHECK: vreducebf16 zmm22, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xf7,0x7b] - vreducenepbf16 zmm22, zmm23, 123 + vreducebf16 zmm22, zmm23, 123 -// CHECK: vreducenepbf16 zmm22 {k7}, zmm23, 123 +// CHECK: vreducebf16 zmm22 {k7}, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x56,0xf7,0x7b] - vreducenepbf16 zmm22 {k7}, zmm23, 123 + vreducebf16 zmm22 {k7}, zmm23, 123 -// CHECK: vreducenepbf16 zmm22 {k7} {z}, zmm23, 123 +// CHECK: vreducebf16 zmm22 {k7} {z}, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x56,0xf7,0x7b] - vreducenepbf16 zmm22 {k7} {z}, zmm23, 123 + vreducebf16 zmm22 {k7} {z}, zmm23, 123 -// CHECK: vreducenepbf16 ymm22, ymm23, 123 +// CHECK: vreducebf16 ymm22, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xf7,0x7b] - vreducenepbf16 ymm22, ymm23, 123 + vreducebf16 ymm22, ymm23, 123 -// CHECK: vreducenepbf16 ymm22 {k7}, ymm23, 123 +// CHECK: vreducebf16 ymm22 {k7}, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x56,0xf7,0x7b] - vreducenepbf16 ymm22 {k7}, ymm23, 123 + vreducebf16 ymm22 {k7}, ymm23, 123 -// CHECK: 
vreducenepbf16 ymm22 {k7} {z}, ymm23, 123 +// CHECK: vreducebf16 ymm22 {k7} {z}, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x56,0xf7,0x7b] - vreducenepbf16 ymm22 {k7} {z}, ymm23, 123 + vreducebf16 ymm22 {k7} {z}, ymm23, 123 -// CHECK: vreducenepbf16 xmm22, xmm23, 123 +// CHECK: vreducebf16 xmm22, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xf7,0x7b] - vreducenepbf16 xmm22, xmm23, 123 + vreducebf16 xmm22, xmm23, 123 -// CHECK: vreducenepbf16 xmm22 {k7}, xmm23, 123 +// CHECK: vreducebf16 xmm22 {k7}, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x56,0xf7,0x7b] - vreducenepbf16 xmm22 {k7}, xmm23, 123 + vreducebf16 xmm22 {k7}, xmm23, 123 -// CHECK: vreducenepbf16 xmm22 {k7} {z}, xmm23, 123 +// CHECK: vreducebf16 xmm22 {k7} {z}, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x56,0xf7,0x7b] - vreducenepbf16 xmm22 {k7} {z}, xmm23, 123 + vreducebf16 xmm22 {k7} {z}, xmm23, 123 -// CHECK: vreducenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vreducebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 + vreducebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vreducenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vreducebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 + vreducebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vreducenepbf16 xmm22, word ptr [rip]{1to8}, 123 +// CHECK: vreducebf16 xmm22, word ptr [rip]{1to8}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x56,0x35,0x00,0x00,0x00,0x00,0x7b] - vreducenepbf16 xmm22, word ptr [rip]{1to8}, 123 + vreducebf16 xmm22, word ptr [rip]{1to8}, 123 -// CHECK: vreducenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123 +// CHECK: 
vreducebf16 xmm22, xmmword ptr [2*rbp - 512], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x56,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vreducenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123 + vreducebf16 xmm22, xmmword ptr [2*rbp - 512], 123 -// CHECK: vreducenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 +// CHECK: vreducebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x56,0x71,0x7f,0x7b] - vreducenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 + vreducebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 -// CHECK: vreducenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 +// CHECK: vreducebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x56,0x72,0x80,0x7b] - vreducenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 + vreducebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 -// CHECK: vreducenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vreducebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 + vreducebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vreducenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vreducebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 + vreducebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vreducenepbf16 ymm22, word ptr [rip]{1to16}, 123 +// CHECK: vreducebf16 ymm22, word ptr [rip]{1to16}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x56,0x35,0x00,0x00,0x00,0x00,0x7b] - vreducenepbf16 ymm22, word ptr [rip]{1to16}, 123 + vreducebf16 ymm22, word ptr [rip]{1to16}, 123 -// CHECK: vreducenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 +// CHECK: vreducebf16 
ymm22, ymmword ptr [2*rbp - 1024], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x56,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vreducenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 + vreducebf16 ymm22, ymmword ptr [2*rbp - 1024], 123 -// CHECK: vreducenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 +// CHECK: vreducebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x56,0x71,0x7f,0x7b] - vreducenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 + vreducebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 -// CHECK: vreducenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 +// CHECK: vreducebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x56,0x72,0x80,0x7b] - vreducenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 + vreducebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 -// CHECK: vreducenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vreducebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x56,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vreducenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 + vreducebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vreducenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vreducebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x56,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vreducenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 + vreducebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vreducenepbf16 zmm22, word ptr [rip]{1to32}, 123 +// CHECK: vreducebf16 zmm22, word ptr [rip]{1to32}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x58,0x56,0x35,0x00,0x00,0x00,0x00,0x7b] - vreducenepbf16 zmm22, word ptr [rip]{1to32}, 123 + vreducebf16 zmm22, word ptr [rip]{1to32}, 123 -// CHECK: vreducenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 +// CHECK: vreducebf16 zmm22, 
zmmword ptr [2*rbp - 2048], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x56,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vreducenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 + vreducebf16 zmm22, zmmword ptr [2*rbp - 2048], 123 -// CHECK: vreducenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 +// CHECK: vreducebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x56,0x71,0x7f,0x7b] - vreducenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 + vreducebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 -// CHECK: vreducenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 +// CHECK: vreducebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x56,0x72,0x80,0x7b] - vreducenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 + vreducebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 -// CHECK: vrndscalenepbf16 zmm22, zmm23, 123 +// CHECK: vrndscalebf16 zmm22, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xf7,0x7b] - vrndscalenepbf16 zmm22, zmm23, 123 + vrndscalebf16 zmm22, zmm23, 123 -// CHECK: vrndscalenepbf16 zmm22 {k7}, zmm23, 123 +// CHECK: vrndscalebf16 zmm22 {k7}, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x4f,0x08,0xf7,0x7b] - vrndscalenepbf16 zmm22 {k7}, zmm23, 123 + vrndscalebf16 zmm22 {k7}, zmm23, 123 -// CHECK: vrndscalenepbf16 zmm22 {k7} {z}, zmm23, 123 +// CHECK: vrndscalebf16 zmm22 {k7} {z}, zmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0xcf,0x08,0xf7,0x7b] - vrndscalenepbf16 zmm22 {k7} {z}, zmm23, 123 + vrndscalebf16 zmm22 {k7} {z}, zmm23, 123 -// CHECK: vrndscalenepbf16 ymm22, ymm23, 123 +// CHECK: vrndscalebf16 ymm22, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xf7,0x7b] - vrndscalenepbf16 ymm22, ymm23, 123 + vrndscalebf16 ymm22, ymm23, 123 -// CHECK: vrndscalenepbf16 ymm22 {k7}, ymm23, 123 +// CHECK: vrndscalebf16 ymm22 {k7}, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x2f,0x08,0xf7,0x7b] - vrndscalenepbf16 ymm22 {k7}, 
ymm23, 123 + vrndscalebf16 ymm22 {k7}, ymm23, 123 -// CHECK: vrndscalenepbf16 ymm22 {k7} {z}, ymm23, 123 +// CHECK: vrndscalebf16 ymm22 {k7} {z}, ymm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0xaf,0x08,0xf7,0x7b] - vrndscalenepbf16 ymm22 {k7} {z}, ymm23, 123 + vrndscalebf16 ymm22 {k7} {z}, ymm23, 123 -// CHECK: vrndscalenepbf16 xmm22, xmm23, 123 +// CHECK: vrndscalebf16 xmm22, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xf7,0x7b] - vrndscalenepbf16 xmm22, xmm23, 123 + vrndscalebf16 xmm22, xmm23, 123 -// CHECK: vrndscalenepbf16 xmm22 {k7}, xmm23, 123 +// CHECK: vrndscalebf16 xmm22 {k7}, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x0f,0x08,0xf7,0x7b] - vrndscalenepbf16 xmm22 {k7}, xmm23, 123 + vrndscalebf16 xmm22 {k7}, xmm23, 123 -// CHECK: vrndscalenepbf16 xmm22 {k7} {z}, xmm23, 123 +// CHECK: vrndscalebf16 xmm22 {k7} {z}, xmm23, 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x8f,0x08,0xf7,0x7b] - vrndscalenepbf16 xmm22 {k7} {z}, xmm23, 123 + vrndscalebf16 xmm22 {k7} {z}, xmm23, 123 -// CHECK: vrndscalenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vrndscalebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x08,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 + vrndscalebf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vrndscalenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vrndscalebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x0f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 + vrndscalebf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vrndscalenepbf16 xmm22, word ptr [rip]{1to8}, 123 +// CHECK: vrndscalebf16 xmm22, word ptr [rip]{1to8}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x18,0x08,0x35,0x00,0x00,0x00,0x00,0x7b] - vrndscalenepbf16 xmm22, word ptr [rip]{1to8}, 123 + 
vrndscalebf16 xmm22, word ptr [rip]{1to8}, 123 -// CHECK: vrndscalenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123 +// CHECK: vrndscalebf16 xmm22, xmmword ptr [2*rbp - 512], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x08,0x08,0x34,0x6d,0x00,0xfe,0xff,0xff,0x7b] - vrndscalenepbf16 xmm22, xmmword ptr [2*rbp - 512], 123 + vrndscalebf16 xmm22, xmmword ptr [2*rbp - 512], 123 -// CHECK: vrndscalenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 +// CHECK: vrndscalebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x8f,0x08,0x71,0x7f,0x7b] - vrndscalenepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 + vrndscalebf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032], 123 -// CHECK: vrndscalenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 +// CHECK: vrndscalebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x9f,0x08,0x72,0x80,0x7b] - vrndscalenepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 + vrndscalebf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8}, 123 -// CHECK: vrndscalenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vrndscalebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x28,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 + vrndscalebf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vrndscalenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vrndscalebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x2f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 + vrndscalebf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vrndscalenepbf16 ymm22, word ptr [rip]{1to16}, 123 +// CHECK: vrndscalebf16 ymm22, word ptr [rip]{1to16}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x38,0x08,0x35,0x00,0x00,0x00,0x00,0x7b] - vrndscalenepbf16 
ymm22, word ptr [rip]{1to16}, 123 + vrndscalebf16 ymm22, word ptr [rip]{1to16}, 123 -// CHECK: vrndscalenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 +// CHECK: vrndscalebf16 ymm22, ymmword ptr [2*rbp - 1024], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x28,0x08,0x34,0x6d,0x00,0xfc,0xff,0xff,0x7b] - vrndscalenepbf16 ymm22, ymmword ptr [2*rbp - 1024], 123 + vrndscalebf16 ymm22, ymmword ptr [2*rbp - 1024], 123 -// CHECK: vrndscalenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 +// CHECK: vrndscalebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xaf,0x08,0x71,0x7f,0x7b] - vrndscalenepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 + vrndscalebf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064], 123 -// CHECK: vrndscalenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 +// CHECK: vrndscalebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xbf,0x08,0x72,0x80,0x7b] - vrndscalenepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 + vrndscalebf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16}, 123 -// CHECK: vrndscalenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 +// CHECK: vrndscalebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 // CHECK: encoding: [0x62,0xa3,0x7f,0x48,0x08,0xb4,0xf5,0x00,0x00,0x00,0x10,0x7b] - vrndscalenepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 + vrndscalebf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456], 123 -// CHECK: vrndscalenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 +// CHECK: vrndscalebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 // CHECK: encoding: [0x62,0xc3,0x7f,0x4f,0x08,0xb4,0x80,0x23,0x01,0x00,0x00,0x7b] - vrndscalenepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 + vrndscalebf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291], 123 -// CHECK: vrndscalenepbf16 zmm22, word ptr [rip]{1to32}, 123 +// CHECK: vrndscalebf16 zmm22, word ptr [rip]{1to32}, 123 // CHECK: encoding: 
[0x62,0xe3,0x7f,0x58,0x08,0x35,0x00,0x00,0x00,0x00,0x7b] - vrndscalenepbf16 zmm22, word ptr [rip]{1to32}, 123 + vrndscalebf16 zmm22, word ptr [rip]{1to32}, 123 -// CHECK: vrndscalenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 +// CHECK: vrndscalebf16 zmm22, zmmword ptr [2*rbp - 2048], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0x48,0x08,0x34,0x6d,0x00,0xf8,0xff,0xff,0x7b] - vrndscalenepbf16 zmm22, zmmword ptr [2*rbp - 2048], 123 + vrndscalebf16 zmm22, zmmword ptr [2*rbp - 2048], 123 -// CHECK: vrndscalenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 +// CHECK: vrndscalebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xcf,0x08,0x71,0x7f,0x7b] - vrndscalenepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 + vrndscalebf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128], 123 -// CHECK: vrndscalenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 +// CHECK: vrndscalebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 // CHECK: encoding: [0x62,0xe3,0x7f,0xdf,0x08,0x72,0x80,0x7b] - vrndscalenepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 + vrndscalebf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32}, 123 -// CHECK: vrsqrtpbf16 xmm22, xmm23 +// CHECK: vrsqrtbf16 xmm22, xmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xf7] - vrsqrtpbf16 xmm22, xmm23 + vrsqrtbf16 xmm22, xmm23 -// CHECK: vrsqrtpbf16 xmm22 {k7}, xmm23 +// CHECK: vrsqrtbf16 xmm22 {k7}, xmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x0f,0x4e,0xf7] - vrsqrtpbf16 xmm22 {k7}, xmm23 + vrsqrtbf16 xmm22 {k7}, xmm23 -// CHECK: vrsqrtpbf16 xmm22 {k7} {z}, xmm23 +// CHECK: vrsqrtbf16 xmm22 {k7} {z}, xmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x8f,0x4e,0xf7] - vrsqrtpbf16 xmm22 {k7} {z}, xmm23 + vrsqrtbf16 xmm22 {k7} {z}, xmm23 -// CHECK: vrsqrtpbf16 zmm22, zmm23 +// CHECK: vrsqrtbf16 zmm22, zmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xf7] - vrsqrtpbf16 zmm22, zmm23 + vrsqrtbf16 zmm22, zmm23 -// CHECK: vrsqrtpbf16 zmm22 {k7}, zmm23 +// CHECK: vrsqrtbf16 zmm22 
{k7}, zmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x4f,0x4e,0xf7] - vrsqrtpbf16 zmm22 {k7}, zmm23 + vrsqrtbf16 zmm22 {k7}, zmm23 -// CHECK: vrsqrtpbf16 zmm22 {k7} {z}, zmm23 +// CHECK: vrsqrtbf16 zmm22 {k7} {z}, zmm23 // CHECK: encoding: [0x62,0xa6,0x7c,0xcf,0x4e,0xf7] - vrsqrtpbf16 zmm22 {k7} {z}, zmm23 + vrsqrtbf16 zmm22 {k7} {z}, zmm23 -// CHECK: vrsqrtpbf16 ymm22, ymm23 +// CHECK: vrsqrtbf16 ymm22, ymm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xf7] - vrsqrtpbf16 ymm22, ymm23 + vrsqrtbf16 ymm22, ymm23 -// CHECK: vrsqrtpbf16 ymm22 {k7}, ymm23 +// CHECK: vrsqrtbf16 ymm22 {k7}, ymm23 // CHECK: encoding: [0x62,0xa6,0x7c,0x2f,0x4e,0xf7] - vrsqrtpbf16 ymm22 {k7}, ymm23 + vrsqrtbf16 ymm22 {k7}, ymm23 -// CHECK: vrsqrtpbf16 ymm22 {k7} {z}, ymm23 +// CHECK: vrsqrtbf16 ymm22 {k7} {z}, ymm23 // CHECK: encoding: [0x62,0xa6,0x7c,0xaf,0x4e,0xf7] - vrsqrtpbf16 ymm22 {k7} {z}, ymm23 + vrsqrtbf16 ymm22 {k7} {z}, ymm23 -// CHECK: vrsqrtpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vrsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x7c,0x08,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrsqrtpbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] + vrsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vrsqrtpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vrsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x7c,0x0f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00] - vrsqrtpbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] + vrsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vrsqrtpbf16 xmm22, word ptr [rip]{1to8} +// CHECK: vrsqrtbf16 xmm22, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x7c,0x18,0x4e,0x35,0x00,0x00,0x00,0x00] - vrsqrtpbf16 xmm22, word ptr [rip]{1to8} + vrsqrtbf16 xmm22, word ptr [rip]{1to8} -// CHECK: vrsqrtpbf16 xmm22, xmmword ptr [2*rbp - 512] +// CHECK: vrsqrtbf16 xmm22, xmmword ptr [2*rbp - 512] // CHECK: encoding: 
[0x62,0xe6,0x7c,0x08,0x4e,0x34,0x6d,0x00,0xfe,0xff,0xff] - vrsqrtpbf16 xmm22, xmmword ptr [2*rbp - 512] + vrsqrtbf16 xmm22, xmmword ptr [2*rbp - 512] -// CHECK: vrsqrtpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] +// CHECK: vrsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x7c,0x8f,0x4e,0x71,0x7f] - vrsqrtpbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] + vrsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] -// CHECK: vrsqrtpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +// CHECK: vrsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x7c,0x9f,0x4e,0x72,0x80] - vrsqrtpbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} + vrsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} -// CHECK: vrsqrtpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vrsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x7c,0x28,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrsqrtpbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] + vrsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vrsqrtpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vrsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x7c,0x2f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00] - vrsqrtpbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] + vrsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vrsqrtpbf16 ymm22, word ptr [rip]{1to16} +// CHECK: vrsqrtbf16 ymm22, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x7c,0x38,0x4e,0x35,0x00,0x00,0x00,0x00] - vrsqrtpbf16 ymm22, word ptr [rip]{1to16} + vrsqrtbf16 ymm22, word ptr [rip]{1to16} -// CHECK: vrsqrtpbf16 ymm22, ymmword ptr [2*rbp - 1024] +// CHECK: vrsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x7c,0x28,0x4e,0x34,0x6d,0x00,0xfc,0xff,0xff] - vrsqrtpbf16 ymm22, ymmword ptr [2*rbp - 1024] + vrsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024] -// CHECK: vrsqrtpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 
4064] +// CHECK: vrsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x7c,0xaf,0x4e,0x71,0x7f] - vrsqrtpbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] + vrsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] -// CHECK: vrsqrtpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +// CHECK: vrsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x7c,0xbf,0x4e,0x72,0x80] - vrsqrtpbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} + vrsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} -// CHECK: vrsqrtpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vrsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x7c,0x48,0x4e,0xb4,0xf5,0x00,0x00,0x00,0x10] - vrsqrtpbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] + vrsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vrsqrtpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vrsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x7c,0x4f,0x4e,0xb4,0x80,0x23,0x01,0x00,0x00] - vrsqrtpbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] + vrsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vrsqrtpbf16 zmm22, word ptr [rip]{1to32} +// CHECK: vrsqrtbf16 zmm22, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x7c,0x58,0x4e,0x35,0x00,0x00,0x00,0x00] - vrsqrtpbf16 zmm22, word ptr [rip]{1to32} + vrsqrtbf16 zmm22, word ptr [rip]{1to32} -// CHECK: vrsqrtpbf16 zmm22, zmmword ptr [2*rbp - 2048] +// CHECK: vrsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x7c,0x48,0x4e,0x34,0x6d,0x00,0xf8,0xff,0xff] - vrsqrtpbf16 zmm22, zmmword ptr [2*rbp - 2048] + vrsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048] -// CHECK: vrsqrtpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +// CHECK: vrsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x7c,0xcf,0x4e,0x71,0x7f] - vrsqrtpbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] + vrsqrtbf16 zmm22 {k7} 
{z}, zmmword ptr [rcx + 8128] -// CHECK: vrsqrtpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} +// CHECK: vrsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x7c,0xdf,0x4e,0x72,0x80] - vrsqrtpbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} + vrsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} -// CHECK: vscalefpbf16 ymm22, ymm23, ymm24 +// CHECK: vscalefbf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x20,0x2c,0xf0] - vscalefpbf16 ymm22, ymm23, ymm24 + vscalefbf16 ymm22, ymm23, ymm24 -// CHECK: vscalefpbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vscalefbf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0x27,0x2c,0xf0] - vscalefpbf16 ymm22 {k7}, ymm23, ymm24 + vscalefbf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vscalefbf16 ymm22 {k7} {z}, ymm23, ymm24 // CHECK: encoding: [0x62,0x86,0x44,0xa7,0x2c,0xf0] - vscalefpbf16 ymm22 {k7} {z}, ymm23, ymm24 + vscalefbf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vscalefpbf16 zmm22, zmm23, zmm24 +// CHECK: vscalefbf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x40,0x2c,0xf0] - vscalefpbf16 zmm22, zmm23, zmm24 + vscalefbf16 zmm22, zmm23, zmm24 -// CHECK: vscalefpbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vscalefbf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0x47,0x2c,0xf0] - vscalefpbf16 zmm22 {k7}, zmm23, zmm24 + vscalefbf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vscalefbf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x86,0x44,0xc7,0x2c,0xf0] - vscalefpbf16 zmm22 {k7} {z}, zmm23, zmm24 + vscalefbf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vscalefpbf16 xmm22, xmm23, xmm24 +// CHECK: vscalefbf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x00,0x2c,0xf0] - vscalefpbf16 xmm22, xmm23, xmm24 + vscalefbf16 xmm22, xmm23, xmm24 -// CHECK: vscalefpbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vscalefbf16 xmm22 {k7}, xmm23, xmm24 
// CHECK: encoding: [0x62,0x86,0x44,0x07,0x2c,0xf0] - vscalefpbf16 xmm22 {k7}, xmm23, xmm24 + vscalefbf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vscalefbf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x86,0x44,0x87,0x2c,0xf0] - vscalefpbf16 xmm22 {k7} {z}, xmm23, xmm24 + vscalefbf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vscalefpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vscalefbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x40,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vscalefpbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vscalefbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vscalefpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vscalefbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x47,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00] - vscalefpbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vscalefbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vscalefpbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vscalefbf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0x50,0x2c,0x35,0x00,0x00,0x00,0x00] - vscalefpbf16 zmm22, zmm23, word ptr [rip]{1to32} + vscalefbf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vscalefpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vscalefbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe6,0x44,0x40,0x2c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vscalefpbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vscalefbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vscalefpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vscalefbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe6,0x44,0xc7,0x2c,0x71,0x7f] - vscalefpbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vscalefbf16 zmm22 {k7} {z}, zmm23, 
zmmword ptr [rcx + 8128] -// CHECK: vscalefpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vscalefbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe6,0x44,0xd7,0x2c,0x72,0x80] - vscalefpbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vscalefbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vscalefpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vscalefbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x20,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vscalefpbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vscalefbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vscalefpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vscalefbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x27,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00] - vscalefpbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vscalefbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vscalefpbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vscalefbf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0x30,0x2c,0x35,0x00,0x00,0x00,0x00] - vscalefpbf16 ymm22, ymm23, word ptr [rip]{1to16} + vscalefbf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vscalefpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vscalefbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe6,0x44,0x20,0x2c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vscalefpbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vscalefbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vscalefpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vscalefbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe6,0x44,0xa7,0x2c,0x71,0x7f] - vscalefpbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vscalefbf16 ymm22 {k7} {z}, ymm23, ymmword ptr 
[rcx + 4064] -// CHECK: vscalefpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vscalefbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe6,0x44,0xb7,0x2c,0x72,0x80] - vscalefpbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vscalefbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vscalefpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vscalefbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa6,0x44,0x00,0x2c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vscalefpbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vscalefbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vscalefpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vscalefbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc6,0x44,0x07,0x2c,0xb4,0x80,0x23,0x01,0x00,0x00] - vscalefpbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] + vscalefbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vscalefpbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vscalefbf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x10,0x2c,0x35,0x00,0x00,0x00,0x00] - vscalefpbf16 xmm22, xmm23, word ptr [rip]{1to8} + vscalefbf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vscalefpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vscalefbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe6,0x44,0x00,0x2c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vscalefpbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vscalefbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vscalefpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vscalefbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe6,0x44,0x87,0x2c,0x71,0x7f] - vscalefpbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vscalefbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// 
CHECK: vscalefpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vscalefbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe6,0x44,0x97,0x2c,0x72,0x80] - vscalefpbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vscalefbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} -// CHECK: vsqrtnepbf16 xmm22, xmm23 +// CHECK: vsqrtbf16 xmm22, xmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xf7] - vsqrtnepbf16 xmm22, xmm23 + vsqrtbf16 xmm22, xmm23 -// CHECK: vsqrtnepbf16 xmm22 {k7}, xmm23 +// CHECK: vsqrtbf16 xmm22 {k7}, xmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x0f,0x51,0xf7] - vsqrtnepbf16 xmm22 {k7}, xmm23 + vsqrtbf16 xmm22 {k7}, xmm23 -// CHECK: vsqrtnepbf16 xmm22 {k7} {z}, xmm23 +// CHECK: vsqrtbf16 xmm22 {k7} {z}, xmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x8f,0x51,0xf7] - vsqrtnepbf16 xmm22 {k7} {z}, xmm23 + vsqrtbf16 xmm22 {k7} {z}, xmm23 -// CHECK: vsqrtnepbf16 zmm22, zmm23 +// CHECK: vsqrtbf16 zmm22, zmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xf7] - vsqrtnepbf16 zmm22, zmm23 + vsqrtbf16 zmm22, zmm23 -// CHECK: vsqrtnepbf16 zmm22 {k7}, zmm23 +// CHECK: vsqrtbf16 zmm22 {k7}, zmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x4f,0x51,0xf7] - vsqrtnepbf16 zmm22 {k7}, zmm23 + vsqrtbf16 zmm22 {k7}, zmm23 -// CHECK: vsqrtnepbf16 zmm22 {k7} {z}, zmm23 +// CHECK: vsqrtbf16 zmm22 {k7} {z}, zmm23 // CHECK: encoding: [0x62,0xa5,0x7d,0xcf,0x51,0xf7] - vsqrtnepbf16 zmm22 {k7} {z}, zmm23 + vsqrtbf16 zmm22 {k7} {z}, zmm23 -// CHECK: vsqrtnepbf16 ymm22, ymm23 +// CHECK: vsqrtbf16 ymm22, ymm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xf7] - vsqrtnepbf16 ymm22, ymm23 + vsqrtbf16 ymm22, ymm23 -// CHECK: vsqrtnepbf16 ymm22 {k7}, ymm23 +// CHECK: vsqrtbf16 ymm22 {k7}, ymm23 // CHECK: encoding: [0x62,0xa5,0x7d,0x2f,0x51,0xf7] - vsqrtnepbf16 ymm22 {k7}, ymm23 + vsqrtbf16 ymm22 {k7}, ymm23 -// CHECK: vsqrtnepbf16 ymm22 {k7} {z}, ymm23 +// CHECK: vsqrtbf16 ymm22 {k7} {z}, ymm23 // CHECK: encoding: 
[0x62,0xa5,0x7d,0xaf,0x51,0xf7] - vsqrtnepbf16 ymm22 {k7} {z}, ymm23 + vsqrtbf16 ymm22 {k7} {z}, ymm23 -// CHECK: vsqrtnepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x7d,0x08,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsqrtnepbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] + vsqrtbf16 xmm22, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vsqrtnepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x7d,0x0f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00] - vsqrtnepbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] + vsqrtbf16 xmm22 {k7}, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vsqrtnepbf16 xmm22, word ptr [rip]{1to8} +// CHECK: vsqrtbf16 xmm22, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x7d,0x18,0x51,0x35,0x00,0x00,0x00,0x00] - vsqrtnepbf16 xmm22, word ptr [rip]{1to8} + vsqrtbf16 xmm22, word ptr [rip]{1to8} -// CHECK: vsqrtnepbf16 xmm22, xmmword ptr [2*rbp - 512] +// CHECK: vsqrtbf16 xmm22, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x7d,0x08,0x51,0x34,0x6d,0x00,0xfe,0xff,0xff] - vsqrtnepbf16 xmm22, xmmword ptr [2*rbp - 512] + vsqrtbf16 xmm22, xmmword ptr [2*rbp - 512] -// CHECK: vsqrtnepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] +// CHECK: vsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe5,0x7d,0x8f,0x51,0x71,0x7f] - vsqrtnepbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] + vsqrtbf16 xmm22 {k7} {z}, xmmword ptr [rcx + 2032] -// CHECK: vsqrtnepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} +// CHECK: vsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe5,0x7d,0x9f,0x51,0x72,0x80] - vsqrtnepbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} + vsqrtbf16 xmm22 {k7} {z}, word ptr [rdx - 256]{1to8} -// CHECK: vsqrtnepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vsqrtbf16 ymm22, ymmword ptr [rbp + 
8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x7d,0x28,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsqrtnepbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] + vsqrtbf16 ymm22, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vsqrtnepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x7d,0x2f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00] - vsqrtnepbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] + vsqrtbf16 ymm22 {k7}, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vsqrtnepbf16 ymm22, word ptr [rip]{1to16} +// CHECK: vsqrtbf16 ymm22, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x7d,0x38,0x51,0x35,0x00,0x00,0x00,0x00] - vsqrtnepbf16 ymm22, word ptr [rip]{1to16} + vsqrtbf16 ymm22, word ptr [rip]{1to16} -// CHECK: vsqrtnepbf16 ymm22, ymmword ptr [2*rbp - 1024] +// CHECK: vsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x7d,0x28,0x51,0x34,0x6d,0x00,0xfc,0xff,0xff] - vsqrtnepbf16 ymm22, ymmword ptr [2*rbp - 1024] + vsqrtbf16 ymm22, ymmword ptr [2*rbp - 1024] -// CHECK: vsqrtnepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] +// CHECK: vsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x7d,0xaf,0x51,0x71,0x7f] - vsqrtnepbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] + vsqrtbf16 ymm22 {k7} {z}, ymmword ptr [rcx + 4064] -// CHECK: vsqrtnepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} +// CHECK: vsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe5,0x7d,0xbf,0x51,0x72,0x80] - vsqrtnepbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} + vsqrtbf16 ymm22 {k7} {z}, word ptr [rdx - 256]{1to16} -// CHECK: vsqrtnepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x7d,0x48,0x51,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsqrtnepbf16 zmm22, zmmword ptr [rbp + 8*r14 + 268435456] + vsqrtbf16 zmm22, zmmword ptr [rbp + 8*r14 + 
268435456] -// CHECK: vsqrtnepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x7d,0x4f,0x51,0xb4,0x80,0x23,0x01,0x00,0x00] - vsqrtnepbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] + vsqrtbf16 zmm22 {k7}, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vsqrtnepbf16 zmm22, word ptr [rip]{1to32} +// CHECK: vsqrtbf16 zmm22, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x7d,0x58,0x51,0x35,0x00,0x00,0x00,0x00] - vsqrtnepbf16 zmm22, word ptr [rip]{1to32} + vsqrtbf16 zmm22, word ptr [rip]{1to32} -// CHECK: vsqrtnepbf16 zmm22, zmmword ptr [2*rbp - 2048] +// CHECK: vsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe5,0x7d,0x48,0x51,0x34,0x6d,0x00,0xf8,0xff,0xff] - vsqrtnepbf16 zmm22, zmmword ptr [2*rbp - 2048] + vsqrtbf16 zmm22, zmmword ptr [2*rbp - 2048] -// CHECK: vsqrtnepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] +// CHECK: vsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x7d,0xcf,0x51,0x71,0x7f] - vsqrtnepbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] + vsqrtbf16 zmm22 {k7} {z}, zmmword ptr [rcx + 8128] -// CHECK: vsqrtnepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} +// CHECK: vsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x7d,0xdf,0x51,0x72,0x80] - vsqrtnepbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} + vsqrtbf16 zmm22 {k7} {z}, word ptr [rdx - 256]{1to32} -// CHECK: vsubnepbf16 ymm22, ymm23, ymm24 +// CHECK: vsubbf16 ymm22, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x20,0x5c,0xf0] - vsubnepbf16 ymm22, ymm23, ymm24 + vsubbf16 ymm22, ymm23, ymm24 -// CHECK: vsubnepbf16 ymm22 {k7}, ymm23, ymm24 +// CHECK: vsubbf16 ymm22 {k7}, ymm23, ymm24 // CHECK: encoding: [0x62,0x85,0x45,0x27,0x5c,0xf0] - vsubnepbf16 ymm22 {k7}, ymm23, ymm24 + vsubbf16 ymm22 {k7}, ymm23, ymm24 -// CHECK: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymm24 +// CHECK: vsubbf16 ymm22 {k7} {z}, ymm23, ymm24 // 
CHECK: encoding: [0x62,0x85,0x45,0xa7,0x5c,0xf0] - vsubnepbf16 ymm22 {k7} {z}, ymm23, ymm24 + vsubbf16 ymm22 {k7} {z}, ymm23, ymm24 -// CHECK: vsubnepbf16 zmm22, zmm23, zmm24 +// CHECK: vsubbf16 zmm22, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x40,0x5c,0xf0] - vsubnepbf16 zmm22, zmm23, zmm24 + vsubbf16 zmm22, zmm23, zmm24 -// CHECK: vsubnepbf16 zmm22 {k7}, zmm23, zmm24 +// CHECK: vsubbf16 zmm22 {k7}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0x47,0x5c,0xf0] - vsubnepbf16 zmm22 {k7}, zmm23, zmm24 + vsubbf16 zmm22 {k7}, zmm23, zmm24 -// CHECK: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmm24 +// CHECK: vsubbf16 zmm22 {k7} {z}, zmm23, zmm24 // CHECK: encoding: [0x62,0x85,0x45,0xc7,0x5c,0xf0] - vsubnepbf16 zmm22 {k7} {z}, zmm23, zmm24 + vsubbf16 zmm22 {k7} {z}, zmm23, zmm24 -// CHECK: vsubnepbf16 xmm22, xmm23, xmm24 +// CHECK: vsubbf16 xmm22, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x00,0x5c,0xf0] - vsubnepbf16 xmm22, xmm23, xmm24 + vsubbf16 xmm22, xmm23, xmm24 -// CHECK: vsubnepbf16 xmm22 {k7}, xmm23, xmm24 +// CHECK: vsubbf16 xmm22 {k7}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x07,0x5c,0xf0] - vsubnepbf16 xmm22 {k7}, xmm23, xmm24 + vsubbf16 xmm22 {k7}, xmm23, xmm24 -// CHECK: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmm24 +// CHECK: vsubbf16 xmm22 {k7} {z}, xmm23, xmm24 // CHECK: encoding: [0x62,0x85,0x45,0x87,0x5c,0xf0] - vsubnepbf16 xmm22 {k7} {z}, xmm23, xmm24 + vsubbf16 xmm22 {k7} {z}, xmm23, xmm24 -// CHECK: vsubnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vsubbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x40,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsubnepbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] + vsubbf16 zmm22, zmm23, zmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vsubnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] +// CHECK: vsubbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: 
[0x62,0xc5,0x45,0x47,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00] - vsubnepbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] + vsubbf16 zmm22 {k7}, zmm23, zmmword ptr [r8 + 4*rax + 291] -// CHECK: vsubnepbf16 zmm22, zmm23, word ptr [rip]{1to32} +// CHECK: vsubbf16 zmm22, zmm23, word ptr [rip]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0x50,0x5c,0x35,0x00,0x00,0x00,0x00] - vsubnepbf16 zmm22, zmm23, word ptr [rip]{1to32} + vsubbf16 zmm22, zmm23, word ptr [rip]{1to32} -// CHECK: vsubnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] +// CHECK: vsubbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] // CHECK: encoding: [0x62,0xe5,0x45,0x40,0x5c,0x34,0x6d,0x00,0xf8,0xff,0xff] - vsubnepbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] + vsubbf16 zmm22, zmm23, zmmword ptr [2*rbp - 2048] -// CHECK: vsubnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] +// CHECK: vsubbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] // CHECK: encoding: [0x62,0xe5,0x45,0xc7,0x5c,0x71,0x7f] - vsubnepbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] + vsubbf16 zmm22 {k7} {z}, zmm23, zmmword ptr [rcx + 8128] -// CHECK: vsubnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} +// CHECK: vsubbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} // CHECK: encoding: [0x62,0xe5,0x45,0xd7,0x5c,0x72,0x80] - vsubnepbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} + vsubbf16 zmm22 {k7} {z}, zmm23, word ptr [rdx - 256]{1to32} -// CHECK: vsubnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vsubbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x20,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsubnepbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] + vsubbf16 ymm22, ymm23, ymmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vsubnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] +// CHECK: vsubbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x27,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00] - 
vsubnepbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] + vsubbf16 ymm22 {k7}, ymm23, ymmword ptr [r8 + 4*rax + 291] -// CHECK: vsubnepbf16 ymm22, ymm23, word ptr [rip]{1to16} +// CHECK: vsubbf16 ymm22, ymm23, word ptr [rip]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0x30,0x5c,0x35,0x00,0x00,0x00,0x00] - vsubnepbf16 ymm22, ymm23, word ptr [rip]{1to16} + vsubbf16 ymm22, ymm23, word ptr [rip]{1to16} -// CHECK: vsubnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] +// CHECK: vsubbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] // CHECK: encoding: [0x62,0xe5,0x45,0x20,0x5c,0x34,0x6d,0x00,0xfc,0xff,0xff] - vsubnepbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] + vsubbf16 ymm22, ymm23, ymmword ptr [2*rbp - 1024] -// CHECK: vsubnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] +// CHECK: vsubbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] // CHECK: encoding: [0x62,0xe5,0x45,0xa7,0x5c,0x71,0x7f] - vsubnepbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] + vsubbf16 ymm22 {k7} {z}, ymm23, ymmword ptr [rcx + 4064] -// CHECK: vsubnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} +// CHECK: vsubbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} // CHECK: encoding: [0x62,0xe5,0x45,0xb7,0x5c,0x72,0x80] - vsubnepbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} + vsubbf16 ymm22 {k7} {z}, ymm23, word ptr [rdx - 256]{1to16} -// CHECK: vsubnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] +// CHECK: vsubbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] // CHECK: encoding: [0x62,0xa5,0x45,0x00,0x5c,0xb4,0xf5,0x00,0x00,0x00,0x10] - vsubnepbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] + vsubbf16 xmm22, xmm23, xmmword ptr [rbp + 8*r14 + 268435456] -// CHECK: vsubnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] +// CHECK: vsubbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] // CHECK: encoding: [0x62,0xc5,0x45,0x07,0x5c,0xb4,0x80,0x23,0x01,0x00,0x00] - vsubnepbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] 
+ vsubbf16 xmm22 {k7}, xmm23, xmmword ptr [r8 + 4*rax + 291] -// CHECK: vsubnepbf16 xmm22, xmm23, word ptr [rip]{1to8} +// CHECK: vsubbf16 xmm22, xmm23, word ptr [rip]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x10,0x5c,0x35,0x00,0x00,0x00,0x00] - vsubnepbf16 xmm22, xmm23, word ptr [rip]{1to8} + vsubbf16 xmm22, xmm23, word ptr [rip]{1to8} -// CHECK: vsubnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] +// CHECK: vsubbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] // CHECK: encoding: [0x62,0xe5,0x45,0x00,0x5c,0x34,0x6d,0x00,0xfe,0xff,0xff] - vsubnepbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] + vsubbf16 xmm22, xmm23, xmmword ptr [2*rbp - 512] -// CHECK: vsubnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] +// CHECK: vsubbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] // CHECK: encoding: [0x62,0xe5,0x45,0x87,0x5c,0x71,0x7f] - vsubnepbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] + vsubbf16 xmm22 {k7} {z}, xmm23, xmmword ptr [rcx + 2032] -// CHECK: vsubnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} +// CHECK: vsubbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} // CHECK: encoding: [0x62,0xe5,0x45,0x97,0x5c,0x72,0x80] - vsubnepbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} + vsubbf16 xmm22 {k7} {z}, xmm23, word ptr [rdx - 256]{1to8} diff --git a/llvm/test/TableGen/x86-fold-tables.inc b/llvm/test/TableGen/x86-fold-tables.inc index 954c05bdb2076..f2a3ba854c127 100644 --- a/llvm/test/TableGen/x86-fold-tables.inc +++ b/llvm/test/TableGen/x86-fold-tables.inc @@ -1506,9 +1506,9 @@ static const X86FoldTableEntry Table1[] = { {X86::VEXPANDPSZ128rr, X86::VEXPANDPSZ128rm, TB_NO_REVERSE}, {X86::VEXPANDPSZ256rr, X86::VEXPANDPSZ256rm, TB_NO_REVERSE}, {X86::VEXPANDPSZrr, X86::VEXPANDPSZrm, TB_NO_REVERSE}, - {X86::VFPCLASSPBF16Z128ri, X86::VFPCLASSPBF16Z128mi, 0}, - {X86::VFPCLASSPBF16Z256ri, X86::VFPCLASSPBF16Z256mi, 0}, - {X86::VFPCLASSPBF16Zri, X86::VFPCLASSPBF16Zmi, 0}, + {X86::VFPCLASSBF16Z128ri, X86::VFPCLASSBF16Z128mi, 0}, + 
{X86::VFPCLASSBF16Z256ri, X86::VFPCLASSBF16Z256mi, 0}, + {X86::VFPCLASSBF16Zri, X86::VFPCLASSBF16Zmi, 0}, {X86::VFPCLASSPDZ128ri, X86::VFPCLASSPDZ128mi, 0}, {X86::VFPCLASSPDZ256ri, X86::VFPCLASSPDZ256mi, 0}, {X86::VFPCLASSPDZri, X86::VFPCLASSPDZmi, 0}, @@ -1527,9 +1527,9 @@ static const X86FoldTableEntry Table1[] = { {X86::VFRCZPSrr, X86::VFRCZPSrm, 0}, {X86::VFRCZSDrr, X86::VFRCZSDrm, TB_NO_REVERSE}, {X86::VFRCZSSrr, X86::VFRCZSSrm, TB_NO_REVERSE}, - {X86::VGETEXPPBF16Z128r, X86::VGETEXPPBF16Z128m, 0}, - {X86::VGETEXPPBF16Z256r, X86::VGETEXPPBF16Z256m, 0}, - {X86::VGETEXPPBF16Zr, X86::VGETEXPPBF16Zm, 0}, + {X86::VGETEXPBF16Z128r, X86::VGETEXPBF16Z128m, 0}, + {X86::VGETEXPBF16Z256r, X86::VGETEXPBF16Z256m, 0}, + {X86::VGETEXPBF16Zr, X86::VGETEXPBF16Zm, 0}, {X86::VGETEXPPDZ128r, X86::VGETEXPPDZ128m, 0}, {X86::VGETEXPPDZ256r, X86::VGETEXPPDZ256m, 0}, {X86::VGETEXPPDZr, X86::VGETEXPPDZm, 0}, @@ -1539,9 +1539,9 @@ static const X86FoldTableEntry Table1[] = { {X86::VGETEXPPSZ128r, X86::VGETEXPPSZ128m, 0}, {X86::VGETEXPPSZ256r, X86::VGETEXPPSZ256m, 0}, {X86::VGETEXPPSZr, X86::VGETEXPPSZm, 0}, - {X86::VGETMANTPBF16Z128rri, X86::VGETMANTPBF16Z128rmi, 0}, - {X86::VGETMANTPBF16Z256rri, X86::VGETMANTPBF16Z256rmi, 0}, - {X86::VGETMANTPBF16Zrri, X86::VGETMANTPBF16Zrmi, 0}, + {X86::VGETMANTBF16Z128rri, X86::VGETMANTBF16Z128rmi, 0}, + {X86::VGETMANTBF16Z256rri, X86::VGETMANTBF16Z256rmi, 0}, + {X86::VGETMANTBF16Zrri, X86::VGETMANTBF16Zrmi, 0}, {X86::VGETMANTPDZ128rri, X86::VGETMANTPDZ128rmi, 0}, {X86::VGETMANTPDZ256rri, X86::VGETMANTPDZ256rmi, 0}, {X86::VGETMANTPDZrri, X86::VGETMANTPDZrmi, 0}, @@ -1877,17 +1877,17 @@ static const X86FoldTableEntry Table1[] = { {X86::VRCP14PSZr, X86::VRCP14PSZm, 0}, {X86::VRCP28PDZr, X86::VRCP28PDZm, 0}, {X86::VRCP28PSZr, X86::VRCP28PSZm, 0}, - {X86::VRCPPBF16Z128r, X86::VRCPPBF16Z128m, 0}, - {X86::VRCPPBF16Z256r, X86::VRCPPBF16Z256m, 0}, - {X86::VRCPPBF16Zr, X86::VRCPPBF16Zm, 0}, + {X86::VRCPBF16Z128r, X86::VRCPBF16Z128m, 0}, + {X86::VRCPBF16Z256r, 
X86::VRCPBF16Z256m, 0}, + {X86::VRCPBF16Zr, X86::VRCPBF16Zm, 0}, {X86::VRCPPHZ128r, X86::VRCPPHZ128m, 0}, {X86::VRCPPHZ256r, X86::VRCPPHZ256m, 0}, {X86::VRCPPHZr, X86::VRCPPHZm, 0}, {X86::VRCPPSYr, X86::VRCPPSYm, 0}, {X86::VRCPPSr, X86::VRCPPSm, 0}, - {X86::VREDUCENEPBF16Z128rri, X86::VREDUCENEPBF16Z128rmi, 0}, - {X86::VREDUCENEPBF16Z256rri, X86::VREDUCENEPBF16Z256rmi, 0}, - {X86::VREDUCENEPBF16Zrri, X86::VREDUCENEPBF16Zrmi, 0}, + {X86::VREDUCEBF16Z128rri, X86::VREDUCEBF16Z128rmi, 0}, + {X86::VREDUCEBF16Z256rri, X86::VREDUCEBF16Z256rmi, 0}, + {X86::VREDUCEBF16Zrri, X86::VREDUCEBF16Zrmi, 0}, {X86::VREDUCEPDZ128rri, X86::VREDUCEPDZ128rmi, 0}, {X86::VREDUCEPDZ256rri, X86::VREDUCEPDZ256rmi, 0}, {X86::VREDUCEPDZrri, X86::VREDUCEPDZrmi, 0}, @@ -1897,9 +1897,9 @@ static const X86FoldTableEntry Table1[] = { {X86::VREDUCEPSZ128rri, X86::VREDUCEPSZ128rmi, 0}, {X86::VREDUCEPSZ256rri, X86::VREDUCEPSZ256rmi, 0}, {X86::VREDUCEPSZrri, X86::VREDUCEPSZrmi, 0}, - {X86::VRNDSCALENEPBF16Z128rri, X86::VRNDSCALENEPBF16Z128rmi, 0}, - {X86::VRNDSCALENEPBF16Z256rri, X86::VRNDSCALENEPBF16Z256rmi, 0}, - {X86::VRNDSCALENEPBF16Zrri, X86::VRNDSCALENEPBF16Zrmi, 0}, + {X86::VRNDSCALEBF16Z128rri, X86::VRNDSCALEBF16Z128rmi, 0}, + {X86::VRNDSCALEBF16Z256rri, X86::VRNDSCALEBF16Z256rmi, 0}, + {X86::VRNDSCALEBF16Zrri, X86::VRNDSCALEBF16Zrmi, 0}, {X86::VRNDSCALEPDZ128rri, X86::VRNDSCALEPDZ128rmi, 0}, {X86::VRNDSCALEPDZ256rri, X86::VRNDSCALEPDZ256rmi, 0}, {X86::VRNDSCALEPDZrri, X86::VRNDSCALEPDZrmi, 0}, @@ -1921,17 +1921,17 @@ static const X86FoldTableEntry Table1[] = { {X86::VRSQRT14PSZr, X86::VRSQRT14PSZm, 0}, {X86::VRSQRT28PDZr, X86::VRSQRT28PDZm, 0}, {X86::VRSQRT28PSZr, X86::VRSQRT28PSZm, 0}, - {X86::VRSQRTPBF16Z128r, X86::VRSQRTPBF16Z128m, 0}, - {X86::VRSQRTPBF16Z256r, X86::VRSQRTPBF16Z256m, 0}, - {X86::VRSQRTPBF16Zr, X86::VRSQRTPBF16Zm, 0}, + {X86::VRSQRTBF16Z128r, X86::VRSQRTBF16Z128m, 0}, + {X86::VRSQRTBF16Z256r, X86::VRSQRTBF16Z256m, 0}, + {X86::VRSQRTBF16Zr, X86::VRSQRTBF16Zm, 0}, 
{X86::VRSQRTPHZ128r, X86::VRSQRTPHZ128m, 0}, {X86::VRSQRTPHZ256r, X86::VRSQRTPHZ256m, 0}, {X86::VRSQRTPHZr, X86::VRSQRTPHZm, 0}, {X86::VRSQRTPSYr, X86::VRSQRTPSYm, 0}, {X86::VRSQRTPSr, X86::VRSQRTPSm, 0}, - {X86::VSQRTNEPBF16Z128r, X86::VSQRTNEPBF16Z128m, 0}, - {X86::VSQRTNEPBF16Z256r, X86::VSQRTNEPBF16Z256m, 0}, - {X86::VSQRTNEPBF16Zr, X86::VSQRTNEPBF16Zm, 0}, + {X86::VSQRTBF16Z128r, X86::VSQRTBF16Z128m, 0}, + {X86::VSQRTBF16Z256r, X86::VSQRTBF16Z256m, 0}, + {X86::VSQRTBF16Zr, X86::VSQRTBF16Zm, 0}, {X86::VSQRTPDYr, X86::VSQRTPDYm, 0}, {X86::VSQRTPDZ128r, X86::VSQRTPDZ128m, 0}, {X86::VSQRTPDZ256r, X86::VSQRTPDZ256m, 0}, @@ -2412,9 +2412,9 @@ static const X86FoldTableEntry Table2[] = { {X86::UNPCKHPSrr, X86::UNPCKHPSrm, TB_ALIGN_16}, {X86::UNPCKLPDrr, X86::UNPCKLPDrm, TB_ALIGN_16}, {X86::UNPCKLPSrr, X86::UNPCKLPSrm, TB_ALIGN_16}, - {X86::VADDNEPBF16Z128rr, X86::VADDNEPBF16Z128rm, 0}, - {X86::VADDNEPBF16Z256rr, X86::VADDNEPBF16Z256rm, 0}, - {X86::VADDNEPBF16Zrr, X86::VADDNEPBF16Zrm, 0}, + {X86::VADDBF16Z128rr, X86::VADDBF16Z128rm, 0}, + {X86::VADDBF16Z256rr, X86::VADDBF16Z256rm, 0}, + {X86::VADDBF16Zrr, X86::VADDBF16Zrm, 0}, {X86::VADDPDYrr, X86::VADDPDYrm, 0}, {X86::VADDPDZ128rr, X86::VADDPDZ128rm, 0}, {X86::VADDPDZ256rr, X86::VADDPDZ256rm, 0}, @@ -2512,9 +2512,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VBROADCASTSSZ128rrkz, X86::VBROADCASTSSZ128rmkz, TB_NO_REVERSE}, {X86::VBROADCASTSSZ256rrkz, X86::VBROADCASTSSZ256rmkz, TB_NO_REVERSE}, {X86::VBROADCASTSSZrrkz, X86::VBROADCASTSSZrmkz, TB_NO_REVERSE}, - {X86::VCMPPBF16Z128rri, X86::VCMPPBF16Z128rmi, 0}, - {X86::VCMPPBF16Z256rri, X86::VCMPPBF16Z256rmi, 0}, - {X86::VCMPPBF16Zrri, X86::VCMPPBF16Zrmi, 0}, + {X86::VCMPBF16Z128rri, X86::VCMPBF16Z128rmi, 0}, + {X86::VCMPBF16Z256rri, X86::VCMPBF16Z256rmi, 0}, + {X86::VCMPBF16Zrri, X86::VCMPBF16Zrmi, 0}, {X86::VCMPPDYrri, X86::VCMPPDYrmi, 0}, {X86::VCMPPDZ128rri, X86::VCMPPDZ128rmi, 0}, {X86::VCMPPDZ256rri, X86::VCMPPDZ256rmi, 0}, @@ -2844,9 +2844,9 @@ static 
const X86FoldTableEntry Table2[] = { {X86::VDBPSADBWZ128rri, X86::VDBPSADBWZ128rmi, 0}, {X86::VDBPSADBWZ256rri, X86::VDBPSADBWZ256rmi, 0}, {X86::VDBPSADBWZrri, X86::VDBPSADBWZrmi, 0}, - {X86::VDIVNEPBF16Z128rr, X86::VDIVNEPBF16Z128rm, 0}, - {X86::VDIVNEPBF16Z256rr, X86::VDIVNEPBF16Z256rm, 0}, - {X86::VDIVNEPBF16Zrr, X86::VDIVNEPBF16Zrm, 0}, + {X86::VDIVBF16Z128rr, X86::VDIVBF16Z128rm, 0}, + {X86::VDIVBF16Z256rr, X86::VDIVBF16Z256rm, 0}, + {X86::VDIVBF16Zrr, X86::VDIVBF16Zrm, 0}, {X86::VDIVPDYrr, X86::VDIVPDYrm, 0}, {X86::VDIVPDZ128rr, X86::VDIVPDZ128rm, 0}, {X86::VDIVPDZ256rr, X86::VDIVPDZ256rm, 0}, @@ -2929,9 +2929,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VFNMSUBSD4rr_Int, X86::VFNMSUBSD4mr_Int, TB_NO_REVERSE}, {X86::VFNMSUBSS4rr, X86::VFNMSUBSS4mr, 0}, {X86::VFNMSUBSS4rr_Int, X86::VFNMSUBSS4mr_Int, TB_NO_REVERSE}, - {X86::VFPCLASSPBF16Z128rik, X86::VFPCLASSPBF16Z128mik, 0}, - {X86::VFPCLASSPBF16Z256rik, X86::VFPCLASSPBF16Z256mik, 0}, - {X86::VFPCLASSPBF16Zrik, X86::VFPCLASSPBF16Zmik, 0}, + {X86::VFPCLASSBF16Z128rik, X86::VFPCLASSBF16Z128mik, 0}, + {X86::VFPCLASSBF16Z256rik, X86::VFPCLASSBF16Z256mik, 0}, + {X86::VFPCLASSBF16Zrik, X86::VFPCLASSBF16Zmik, 0}, {X86::VFPCLASSPDZ128rik, X86::VFPCLASSPDZ128mik, 0}, {X86::VFPCLASSPDZ256rik, X86::VFPCLASSPDZ256mik, 0}, {X86::VFPCLASSPDZrik, X86::VFPCLASSPDZmik, 0}, @@ -2944,9 +2944,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VFPCLASSSDZrik, X86::VFPCLASSSDZmik, TB_NO_REVERSE}, {X86::VFPCLASSSHZrik, X86::VFPCLASSSHZmik, TB_NO_REVERSE}, {X86::VFPCLASSSSZrik, X86::VFPCLASSSSZmik, TB_NO_REVERSE}, - {X86::VGETEXPPBF16Z128rkz, X86::VGETEXPPBF16Z128mkz, 0}, - {X86::VGETEXPPBF16Z256rkz, X86::VGETEXPPBF16Z256mkz, 0}, - {X86::VGETEXPPBF16Zrkz, X86::VGETEXPPBF16Zmkz, 0}, + {X86::VGETEXPBF16Z128rkz, X86::VGETEXPBF16Z128mkz, 0}, + {X86::VGETEXPBF16Z256rkz, X86::VGETEXPBF16Z256mkz, 0}, + {X86::VGETEXPBF16Zrkz, X86::VGETEXPBF16Zmkz, 0}, {X86::VGETEXPPDZ128rkz, X86::VGETEXPPDZ128mkz, 0}, {X86::VGETEXPPDZ256rkz, 
X86::VGETEXPPDZ256mkz, 0}, {X86::VGETEXPPDZrkz, X86::VGETEXPPDZmkz, 0}, @@ -2959,9 +2959,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VGETEXPSDZr, X86::VGETEXPSDZm, TB_NO_REVERSE}, {X86::VGETEXPSHZr, X86::VGETEXPSHZm, TB_NO_REVERSE}, {X86::VGETEXPSSZr, X86::VGETEXPSSZm, TB_NO_REVERSE}, - {X86::VGETMANTPBF16Z128rrikz, X86::VGETMANTPBF16Z128rmikz, 0}, - {X86::VGETMANTPBF16Z256rrikz, X86::VGETMANTPBF16Z256rmikz, 0}, - {X86::VGETMANTPBF16Zrrikz, X86::VGETMANTPBF16Zrmikz, 0}, + {X86::VGETMANTBF16Z128rrikz, X86::VGETMANTBF16Z128rmikz, 0}, + {X86::VGETMANTBF16Z256rrikz, X86::VGETMANTBF16Z256rmikz, 0}, + {X86::VGETMANTBF16Zrrikz, X86::VGETMANTBF16Zrmikz, 0}, {X86::VGETMANTPDZ128rrikz, X86::VGETMANTPDZ128rmikz, 0}, {X86::VGETMANTPDZ256rrikz, X86::VGETMANTPDZ256rmikz, 0}, {X86::VGETMANTPDZrrikz, X86::VGETMANTPDZrmikz, 0}, @@ -3011,6 +3011,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VINSERTI64X2Z256rri, X86::VINSERTI64X2Z256rmi, 0}, {X86::VINSERTI64X2Zrri, X86::VINSERTI64X2Zrmi, 0}, {X86::VINSERTI64X4Zrri, X86::VINSERTI64X4Zrmi, 0}, + {X86::VMAXBF16Z128rr, X86::VMAXBF16Z128rm, 0}, + {X86::VMAXBF16Z256rr, X86::VMAXBF16Z256rm, 0}, + {X86::VMAXBF16Zrr, X86::VMAXBF16Zrm, 0}, {X86::VMAXCPDYrr, X86::VMAXCPDYrm, 0}, {X86::VMAXCPDZ128rr, X86::VMAXCPDZ128rm, 0}, {X86::VMAXCPDZ256rr, X86::VMAXCPDZ256rm, 0}, @@ -3029,9 +3032,6 @@ static const X86FoldTableEntry Table2[] = { {X86::VMAXCSHZrr, X86::VMAXCSHZrm, 0}, {X86::VMAXCSSZrr, X86::VMAXCSSZrm, 0}, {X86::VMAXCSSrr, X86::VMAXCSSrm, 0}, - {X86::VMAXPBF16Z128rr, X86::VMAXPBF16Z128rm, 0}, - {X86::VMAXPBF16Z256rr, X86::VMAXPBF16Z256rm, 0}, - {X86::VMAXPBF16Zrr, X86::VMAXPBF16Zrm, 0}, {X86::VMAXPDYrr, X86::VMAXPDYrm, 0}, {X86::VMAXPDZ128rr, X86::VMAXPDZ128rm, 0}, {X86::VMAXPDZ256rr, X86::VMAXPDZ256rm, 0}, @@ -3055,6 +3055,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VMAXSSZrr_Int, X86::VMAXSSZrm_Int, TB_NO_REVERSE}, {X86::VMAXSSrr, X86::VMAXSSrm, 0}, {X86::VMAXSSrr_Int, X86::VMAXSSrm_Int, TB_NO_REVERSE}, + 
{X86::VMINBF16Z128rr, X86::VMINBF16Z128rm, 0}, + {X86::VMINBF16Z256rr, X86::VMINBF16Z256rm, 0}, + {X86::VMINBF16Zrr, X86::VMINBF16Zrm, 0}, {X86::VMINCPDYrr, X86::VMINCPDYrm, 0}, {X86::VMINCPDZ128rr, X86::VMINCPDZ128rm, 0}, {X86::VMINCPDZ256rr, X86::VMINCPDZ256rm, 0}, @@ -3091,9 +3094,6 @@ static const X86FoldTableEntry Table2[] = { {X86::VMINMAXSHrri_Int, X86::VMINMAXSHrmi_Int, TB_NO_REVERSE}, {X86::VMINMAXSSrri, X86::VMINMAXSSrmi, 0}, {X86::VMINMAXSSrri_Int, X86::VMINMAXSSrmi_Int, TB_NO_REVERSE}, - {X86::VMINPBF16Z128rr, X86::VMINPBF16Z128rm, 0}, - {X86::VMINPBF16Z256rr, X86::VMINPBF16Z256rm, 0}, - {X86::VMINPBF16Zrr, X86::VMINPBF16Zrm, 0}, {X86::VMINPDYrr, X86::VMINPDYrm, 0}, {X86::VMINPDZ128rr, X86::VMINPDZ128rm, 0}, {X86::VMINPDZ256rr, X86::VMINPDZ256rm, 0}, @@ -3165,9 +3165,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VMPSADBWZ256rri, X86::VMPSADBWZ256rmi, 0}, {X86::VMPSADBWZrri, X86::VMPSADBWZrmi, 0}, {X86::VMPSADBWrri, X86::VMPSADBWrmi, 0}, - {X86::VMULNEPBF16Z128rr, X86::VMULNEPBF16Z128rm, 0}, - {X86::VMULNEPBF16Z256rr, X86::VMULNEPBF16Z256rm, 0}, - {X86::VMULNEPBF16Zrr, X86::VMULNEPBF16Zrm, 0}, + {X86::VMULBF16Z128rr, X86::VMULBF16Z128rm, 0}, + {X86::VMULBF16Z256rr, X86::VMULBF16Z256rm, 0}, + {X86::VMULBF16Zrr, X86::VMULBF16Zrm, 0}, {X86::VMULPDYrr, X86::VMULPDYrm, 0}, {X86::VMULPDZ128rr, X86::VMULPDZ128rm, 0}, {X86::VMULPDZ256rr, X86::VMULPDZ256rm, 0}, @@ -4018,18 +4018,18 @@ static const X86FoldTableEntry Table2[] = { {X86::VRCP28PSZrkz, X86::VRCP28PSZmkz, 0}, {X86::VRCP28SDZr, X86::VRCP28SDZm, TB_NO_REVERSE}, {X86::VRCP28SSZr, X86::VRCP28SSZm, TB_NO_REVERSE}, - {X86::VRCPPBF16Z128rkz, X86::VRCPPBF16Z128mkz, 0}, - {X86::VRCPPBF16Z256rkz, X86::VRCPPBF16Z256mkz, 0}, - {X86::VRCPPBF16Zrkz, X86::VRCPPBF16Zmkz, 0}, + {X86::VRCPBF16Z128rkz, X86::VRCPBF16Z128mkz, 0}, + {X86::VRCPBF16Z256rkz, X86::VRCPBF16Z256mkz, 0}, + {X86::VRCPBF16Zrkz, X86::VRCPBF16Zmkz, 0}, {X86::VRCPPHZ128rkz, X86::VRCPPHZ128mkz, 0}, {X86::VRCPPHZ256rkz, X86::VRCPPHZ256mkz, 0}, 
{X86::VRCPPHZrkz, X86::VRCPPHZmkz, 0}, {X86::VRCPSHZrr, X86::VRCPSHZrm, TB_NO_REVERSE}, {X86::VRCPSSr, X86::VRCPSSm, 0}, {X86::VRCPSSr_Int, X86::VRCPSSm_Int, TB_NO_REVERSE}, - {X86::VREDUCENEPBF16Z128rrikz, X86::VREDUCENEPBF16Z128rmikz, 0}, - {X86::VREDUCENEPBF16Z256rrikz, X86::VREDUCENEPBF16Z256rmikz, 0}, - {X86::VREDUCENEPBF16Zrrikz, X86::VREDUCENEPBF16Zrmikz, 0}, + {X86::VREDUCEBF16Z128rrikz, X86::VREDUCEBF16Z128rmikz, 0}, + {X86::VREDUCEBF16Z256rrikz, X86::VREDUCEBF16Z256rmikz, 0}, + {X86::VREDUCEBF16Zrrikz, X86::VREDUCEBF16Zrmikz, 0}, {X86::VREDUCEPDZ128rrikz, X86::VREDUCEPDZ128rmikz, 0}, {X86::VREDUCEPDZ256rrikz, X86::VREDUCEPDZ256rmikz, 0}, {X86::VREDUCEPDZrrikz, X86::VREDUCEPDZrmikz, 0}, @@ -4042,9 +4042,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VREDUCESDZrri, X86::VREDUCESDZrmi, TB_NO_REVERSE}, {X86::VREDUCESHZrri, X86::VREDUCESHZrmi, TB_NO_REVERSE}, {X86::VREDUCESSZrri, X86::VREDUCESSZrmi, TB_NO_REVERSE}, - {X86::VRNDSCALENEPBF16Z128rrikz, X86::VRNDSCALENEPBF16Z128rmikz, 0}, - {X86::VRNDSCALENEPBF16Z256rrikz, X86::VRNDSCALENEPBF16Z256rmikz, 0}, - {X86::VRNDSCALENEPBF16Zrrikz, X86::VRNDSCALENEPBF16Zrmikz, 0}, + {X86::VRNDSCALEBF16Z128rrikz, X86::VRNDSCALEBF16Z128rmikz, 0}, + {X86::VRNDSCALEBF16Z256rrikz, X86::VRNDSCALEBF16Z256rmikz, 0}, + {X86::VRNDSCALEBF16Zrrikz, X86::VRNDSCALEBF16Zrmikz, 0}, {X86::VRNDSCALEPDZ128rrikz, X86::VRNDSCALEPDZ128rmikz, 0}, {X86::VRNDSCALEPDZ256rrikz, X86::VRNDSCALEPDZ256rmikz, 0}, {X86::VRNDSCALEPDZrrikz, X86::VRNDSCALEPDZrmikz, 0}, @@ -4076,18 +4076,18 @@ static const X86FoldTableEntry Table2[] = { {X86::VRSQRT28PSZrkz, X86::VRSQRT28PSZmkz, 0}, {X86::VRSQRT28SDZr, X86::VRSQRT28SDZm, TB_NO_REVERSE}, {X86::VRSQRT28SSZr, X86::VRSQRT28SSZm, TB_NO_REVERSE}, - {X86::VRSQRTPBF16Z128rkz, X86::VRSQRTPBF16Z128mkz, 0}, - {X86::VRSQRTPBF16Z256rkz, X86::VRSQRTPBF16Z256mkz, 0}, - {X86::VRSQRTPBF16Zrkz, X86::VRSQRTPBF16Zmkz, 0}, + {X86::VRSQRTBF16Z128rkz, X86::VRSQRTBF16Z128mkz, 0}, + {X86::VRSQRTBF16Z256rkz, 
X86::VRSQRTBF16Z256mkz, 0}, + {X86::VRSQRTBF16Zrkz, X86::VRSQRTBF16Zmkz, 0}, {X86::VRSQRTPHZ128rkz, X86::VRSQRTPHZ128mkz, 0}, {X86::VRSQRTPHZ256rkz, X86::VRSQRTPHZ256mkz, 0}, {X86::VRSQRTPHZrkz, X86::VRSQRTPHZmkz, 0}, {X86::VRSQRTSHZrr, X86::VRSQRTSHZrm, TB_NO_REVERSE}, {X86::VRSQRTSSr, X86::VRSQRTSSm, 0}, {X86::VRSQRTSSr_Int, X86::VRSQRTSSm_Int, TB_NO_REVERSE}, - {X86::VSCALEFPBF16Z128rr, X86::VSCALEFPBF16Z128rm, 0}, - {X86::VSCALEFPBF16Z256rr, X86::VSCALEFPBF16Z256rm, 0}, - {X86::VSCALEFPBF16Zrr, X86::VSCALEFPBF16Zrm, 0}, + {X86::VSCALEFBF16Z128rr, X86::VSCALEFBF16Z128rm, 0}, + {X86::VSCALEFBF16Z256rr, X86::VSCALEFBF16Z256rm, 0}, + {X86::VSCALEFBF16Zrr, X86::VSCALEFBF16Zrm, 0}, {X86::VSCALEFPDZ128rr, X86::VSCALEFPDZ128rm, 0}, {X86::VSCALEFPDZ256rr, X86::VSCALEFPDZ256rm, 0}, {X86::VSCALEFPDZrr, X86::VSCALEFPDZrm, 0}, @@ -4128,9 +4128,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VSM4RNDS4Z256rr, X86::VSM4RNDS4Z256rm, 0}, {X86::VSM4RNDS4Zrr, X86::VSM4RNDS4Zrm, 0}, {X86::VSM4RNDS4rr, X86::VSM4RNDS4rm, 0}, - {X86::VSQRTNEPBF16Z128rkz, X86::VSQRTNEPBF16Z128mkz, 0}, - {X86::VSQRTNEPBF16Z256rkz, X86::VSQRTNEPBF16Z256mkz, 0}, - {X86::VSQRTNEPBF16Zrkz, X86::VSQRTNEPBF16Zmkz, 0}, + {X86::VSQRTBF16Z128rkz, X86::VSQRTBF16Z128mkz, 0}, + {X86::VSQRTBF16Z256rkz, X86::VSQRTBF16Z256mkz, 0}, + {X86::VSQRTBF16Zrkz, X86::VSQRTBF16Zmkz, 0}, {X86::VSQRTPDZ128rkz, X86::VSQRTPDZ128mkz, 0}, {X86::VSQRTPDZ256rkz, X86::VSQRTPDZ256mkz, 0}, {X86::VSQRTPDZrkz, X86::VSQRTPDZmkz, 0}, @@ -4150,9 +4150,9 @@ static const X86FoldTableEntry Table2[] = { {X86::VSQRTSSZr_Int, X86::VSQRTSSZm_Int, TB_NO_REVERSE}, {X86::VSQRTSSr, X86::VSQRTSSm, 0}, {X86::VSQRTSSr_Int, X86::VSQRTSSm_Int, TB_NO_REVERSE}, - {X86::VSUBNEPBF16Z128rr, X86::VSUBNEPBF16Z128rm, 0}, - {X86::VSUBNEPBF16Z256rr, X86::VSUBNEPBF16Z256rm, 0}, - {X86::VSUBNEPBF16Zrr, X86::VSUBNEPBF16Zrm, 0}, + {X86::VSUBBF16Z128rr, X86::VSUBBF16Z128rm, 0}, + {X86::VSUBBF16Z256rr, X86::VSUBBF16Z256rm, 0}, + {X86::VSUBBF16Zrr, X86::VSUBBF16Zrm, 
0}, {X86::VSUBPDYrr, X86::VSUBPDYrm, 0}, {X86::VSUBPDZ128rr, X86::VSUBPDZ128rm, 0}, {X86::VSUBPDZ256rr, X86::VSUBPDZ256rm, 0}, @@ -4227,9 +4227,9 @@ static const X86FoldTableEntry Table2[] = { }; static const X86FoldTableEntry Table3[] = { - {X86::VADDNEPBF16Z128rrkz, X86::VADDNEPBF16Z128rmkz, 0}, - {X86::VADDNEPBF16Z256rrkz, X86::VADDNEPBF16Z256rmkz, 0}, - {X86::VADDNEPBF16Zrrkz, X86::VADDNEPBF16Zrmkz, 0}, + {X86::VADDBF16Z128rrkz, X86::VADDBF16Z128rmkz, 0}, + {X86::VADDBF16Z256rrkz, X86::VADDBF16Z256rmkz, 0}, + {X86::VADDBF16Zrrkz, X86::VADDBF16Zrmkz, 0}, {X86::VADDPDZ128rrkz, X86::VADDPDZ128rmkz, 0}, {X86::VADDPDZ256rrkz, X86::VADDPDZ256rmkz, 0}, {X86::VADDPDZrrkz, X86::VADDPDZrmkz, 0}, @@ -4276,9 +4276,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VBROADCASTSSZ128rrk, X86::VBROADCASTSSZ128rmk, TB_NO_REVERSE}, {X86::VBROADCASTSSZ256rrk, X86::VBROADCASTSSZ256rmk, TB_NO_REVERSE}, {X86::VBROADCASTSSZrrk, X86::VBROADCASTSSZrmk, TB_NO_REVERSE}, - {X86::VCMPPBF16Z128rrik, X86::VCMPPBF16Z128rmik, 0}, - {X86::VCMPPBF16Z256rrik, X86::VCMPPBF16Z256rmik, 0}, - {X86::VCMPPBF16Zrrik, X86::VCMPPBF16Zrmik, 0}, + {X86::VCMPBF16Z128rrik, X86::VCMPBF16Z128rmik, 0}, + {X86::VCMPBF16Z256rrik, X86::VCMPBF16Z256rmik, 0}, + {X86::VCMPBF16Zrrik, X86::VCMPBF16Zrmik, 0}, {X86::VCMPPDZ128rrik, X86::VCMPPDZ128rmik, 0}, {X86::VCMPPDZ256rrik, X86::VCMPPDZ256rmik, 0}, {X86::VCMPPDZrrik, X86::VCMPPDZrmik, 0}, @@ -4555,9 +4555,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VDBPSADBWZ128rrikz, X86::VDBPSADBWZ128rmikz, 0}, {X86::VDBPSADBWZ256rrikz, X86::VDBPSADBWZ256rmikz, 0}, {X86::VDBPSADBWZrrikz, X86::VDBPSADBWZrmikz, 0}, - {X86::VDIVNEPBF16Z128rrkz, X86::VDIVNEPBF16Z128rmkz, 0}, - {X86::VDIVNEPBF16Z256rrkz, X86::VDIVNEPBF16Z256rmkz, 0}, - {X86::VDIVNEPBF16Zrrkz, X86::VDIVNEPBF16Zrmkz, 0}, + {X86::VDIVBF16Z128rrkz, X86::VDIVBF16Z128rmkz, 0}, + {X86::VDIVBF16Z256rrkz, X86::VDIVBF16Z256rmkz, 0}, + {X86::VDIVBF16Zrrkz, X86::VDIVBF16Zrmkz, 0}, {X86::VDIVPDZ128rrkz, 
X86::VDIVPDZ128rmkz, 0}, {X86::VDIVPDZ256rrkz, X86::VDIVPDZ256rmkz, 0}, {X86::VDIVPDZrrkz, X86::VDIVPDZrmkz, 0}, @@ -4600,9 +4600,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFIXUPIMMPSZrri, X86::VFIXUPIMMPSZrmi, 0}, {X86::VFIXUPIMMSDZrri, X86::VFIXUPIMMSDZrmi, TB_NO_REVERSE}, {X86::VFIXUPIMMSSZrri, X86::VFIXUPIMMSSZrmi, TB_NO_REVERSE}, - {X86::VFMADD132NEPBF16Z128r, X86::VFMADD132NEPBF16Z128m, 0}, - {X86::VFMADD132NEPBF16Z256r, X86::VFMADD132NEPBF16Z256m, 0}, - {X86::VFMADD132NEPBF16Zr, X86::VFMADD132NEPBF16Zm, 0}, + {X86::VFMADD132BF16Z128r, X86::VFMADD132BF16Z128m, 0}, + {X86::VFMADD132BF16Z256r, X86::VFMADD132BF16Z256m, 0}, + {X86::VFMADD132BF16Zr, X86::VFMADD132BF16Zm, 0}, {X86::VFMADD132PDYr, X86::VFMADD132PDYm, 0}, {X86::VFMADD132PDZ128r, X86::VFMADD132PDZ128m, 0}, {X86::VFMADD132PDZ256r, X86::VFMADD132PDZ256m, 0}, @@ -4626,9 +4626,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFMADD132SSZr_Int, X86::VFMADD132SSZm_Int, TB_NO_REVERSE}, {X86::VFMADD132SSr, X86::VFMADD132SSm, 0}, {X86::VFMADD132SSr_Int, X86::VFMADD132SSm_Int, TB_NO_REVERSE}, - {X86::VFMADD213NEPBF16Z128r, X86::VFMADD213NEPBF16Z128m, 0}, - {X86::VFMADD213NEPBF16Z256r, X86::VFMADD213NEPBF16Z256m, 0}, - {X86::VFMADD213NEPBF16Zr, X86::VFMADD213NEPBF16Zm, 0}, + {X86::VFMADD213BF16Z128r, X86::VFMADD213BF16Z128m, 0}, + {X86::VFMADD213BF16Z256r, X86::VFMADD213BF16Z256m, 0}, + {X86::VFMADD213BF16Zr, X86::VFMADD213BF16Zm, 0}, {X86::VFMADD213PDYr, X86::VFMADD213PDYm, 0}, {X86::VFMADD213PDZ128r, X86::VFMADD213PDZ128m, 0}, {X86::VFMADD213PDZ256r, X86::VFMADD213PDZ256m, 0}, @@ -4652,9 +4652,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFMADD213SSZr_Int, X86::VFMADD213SSZm_Int, TB_NO_REVERSE}, {X86::VFMADD213SSr, X86::VFMADD213SSm, 0}, {X86::VFMADD213SSr_Int, X86::VFMADD213SSm_Int, TB_NO_REVERSE}, - {X86::VFMADD231NEPBF16Z128r, X86::VFMADD231NEPBF16Z128m, 0}, - {X86::VFMADD231NEPBF16Z256r, X86::VFMADD231NEPBF16Z256m, 0}, - {X86::VFMADD231NEPBF16Zr, X86::VFMADD231NEPBF16Zm, 0}, + 
{X86::VFMADD231BF16Z128r, X86::VFMADD231BF16Z128m, 0}, + {X86::VFMADD231BF16Z256r, X86::VFMADD231BF16Z256m, 0}, + {X86::VFMADD231BF16Zr, X86::VFMADD231BF16Zm, 0}, {X86::VFMADD231PDYr, X86::VFMADD231PDYm, 0}, {X86::VFMADD231PDZ128r, X86::VFMADD231PDZ128m, 0}, {X86::VFMADD231PDZ256r, X86::VFMADD231PDZ256m, 0}, @@ -4733,9 +4733,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFMADDSUBPD4rr, X86::VFMADDSUBPD4rm, 0}, {X86::VFMADDSUBPS4Yrr, X86::VFMADDSUBPS4Yrm, 0}, {X86::VFMADDSUBPS4rr, X86::VFMADDSUBPS4rm, 0}, - {X86::VFMSUB132NEPBF16Z128r, X86::VFMSUB132NEPBF16Z128m, 0}, - {X86::VFMSUB132NEPBF16Z256r, X86::VFMSUB132NEPBF16Z256m, 0}, - {X86::VFMSUB132NEPBF16Zr, X86::VFMSUB132NEPBF16Zm, 0}, + {X86::VFMSUB132BF16Z128r, X86::VFMSUB132BF16Z128m, 0}, + {X86::VFMSUB132BF16Z256r, X86::VFMSUB132BF16Z256m, 0}, + {X86::VFMSUB132BF16Zr, X86::VFMSUB132BF16Zm, 0}, {X86::VFMSUB132PDYr, X86::VFMSUB132PDYm, 0}, {X86::VFMSUB132PDZ128r, X86::VFMSUB132PDZ128m, 0}, {X86::VFMSUB132PDZ256r, X86::VFMSUB132PDZ256m, 0}, @@ -4759,9 +4759,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFMSUB132SSZr_Int, X86::VFMSUB132SSZm_Int, TB_NO_REVERSE}, {X86::VFMSUB132SSr, X86::VFMSUB132SSm, 0}, {X86::VFMSUB132SSr_Int, X86::VFMSUB132SSm_Int, TB_NO_REVERSE}, - {X86::VFMSUB213NEPBF16Z128r, X86::VFMSUB213NEPBF16Z128m, 0}, - {X86::VFMSUB213NEPBF16Z256r, X86::VFMSUB213NEPBF16Z256m, 0}, - {X86::VFMSUB213NEPBF16Zr, X86::VFMSUB213NEPBF16Zm, 0}, + {X86::VFMSUB213BF16Z128r, X86::VFMSUB213BF16Z128m, 0}, + {X86::VFMSUB213BF16Z256r, X86::VFMSUB213BF16Z256m, 0}, + {X86::VFMSUB213BF16Zr, X86::VFMSUB213BF16Zm, 0}, {X86::VFMSUB213PDYr, X86::VFMSUB213PDYm, 0}, {X86::VFMSUB213PDZ128r, X86::VFMSUB213PDZ128m, 0}, {X86::VFMSUB213PDZ256r, X86::VFMSUB213PDZ256m, 0}, @@ -4785,9 +4785,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFMSUB213SSZr_Int, X86::VFMSUB213SSZm_Int, TB_NO_REVERSE}, {X86::VFMSUB213SSr, X86::VFMSUB213SSm, 0}, {X86::VFMSUB213SSr_Int, X86::VFMSUB213SSm_Int, TB_NO_REVERSE}, - 
{X86::VFMSUB231NEPBF16Z128r, X86::VFMSUB231NEPBF16Z128m, 0}, - {X86::VFMSUB231NEPBF16Z256r, X86::VFMSUB231NEPBF16Z256m, 0}, - {X86::VFMSUB231NEPBF16Zr, X86::VFMSUB231NEPBF16Zm, 0}, + {X86::VFMSUB231BF16Z128r, X86::VFMSUB231BF16Z128m, 0}, + {X86::VFMSUB231BF16Z256r, X86::VFMSUB231BF16Z256m, 0}, + {X86::VFMSUB231BF16Zr, X86::VFMSUB231BF16Zm, 0}, {X86::VFMSUB231PDYr, X86::VFMSUB231PDYm, 0}, {X86::VFMSUB231PDZ128r, X86::VFMSUB231PDZ128m, 0}, {X86::VFMSUB231PDZ256r, X86::VFMSUB231PDZ256m, 0}, @@ -4866,9 +4866,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFMULCPHZ256rrkz, X86::VFMULCPHZ256rmkz, 0}, {X86::VFMULCPHZrrkz, X86::VFMULCPHZrmkz, 0}, {X86::VFMULCSHZrrkz, X86::VFMULCSHZrmkz, TB_NO_REVERSE}, - {X86::VFNMADD132NEPBF16Z128r, X86::VFNMADD132NEPBF16Z128m, 0}, - {X86::VFNMADD132NEPBF16Z256r, X86::VFNMADD132NEPBF16Z256m, 0}, - {X86::VFNMADD132NEPBF16Zr, X86::VFNMADD132NEPBF16Zm, 0}, + {X86::VFNMADD132BF16Z128r, X86::VFNMADD132BF16Z128m, 0}, + {X86::VFNMADD132BF16Z256r, X86::VFNMADD132BF16Z256m, 0}, + {X86::VFNMADD132BF16Zr, X86::VFNMADD132BF16Zm, 0}, {X86::VFNMADD132PDYr, X86::VFNMADD132PDYm, 0}, {X86::VFNMADD132PDZ128r, X86::VFNMADD132PDZ128m, 0}, {X86::VFNMADD132PDZ256r, X86::VFNMADD132PDZ256m, 0}, @@ -4892,9 +4892,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFNMADD132SSZr_Int, X86::VFNMADD132SSZm_Int, TB_NO_REVERSE}, {X86::VFNMADD132SSr, X86::VFNMADD132SSm, 0}, {X86::VFNMADD132SSr_Int, X86::VFNMADD132SSm_Int, TB_NO_REVERSE}, - {X86::VFNMADD213NEPBF16Z128r, X86::VFNMADD213NEPBF16Z128m, 0}, - {X86::VFNMADD213NEPBF16Z256r, X86::VFNMADD213NEPBF16Z256m, 0}, - {X86::VFNMADD213NEPBF16Zr, X86::VFNMADD213NEPBF16Zm, 0}, + {X86::VFNMADD213BF16Z128r, X86::VFNMADD213BF16Z128m, 0}, + {X86::VFNMADD213BF16Z256r, X86::VFNMADD213BF16Z256m, 0}, + {X86::VFNMADD213BF16Zr, X86::VFNMADD213BF16Zm, 0}, {X86::VFNMADD213PDYr, X86::VFNMADD213PDYm, 0}, {X86::VFNMADD213PDZ128r, X86::VFNMADD213PDZ128m, 0}, {X86::VFNMADD213PDZ256r, X86::VFNMADD213PDZ256m, 0}, @@ -4918,9 +4918,9 
@@ static const X86FoldTableEntry Table3[] = { {X86::VFNMADD213SSZr_Int, X86::VFNMADD213SSZm_Int, TB_NO_REVERSE}, {X86::VFNMADD213SSr, X86::VFNMADD213SSm, 0}, {X86::VFNMADD213SSr_Int, X86::VFNMADD213SSm_Int, TB_NO_REVERSE}, - {X86::VFNMADD231NEPBF16Z128r, X86::VFNMADD231NEPBF16Z128m, 0}, - {X86::VFNMADD231NEPBF16Z256r, X86::VFNMADD231NEPBF16Z256m, 0}, - {X86::VFNMADD231NEPBF16Zr, X86::VFNMADD231NEPBF16Zm, 0}, + {X86::VFNMADD231BF16Z128r, X86::VFNMADD231BF16Z128m, 0}, + {X86::VFNMADD231BF16Z256r, X86::VFNMADD231BF16Z256m, 0}, + {X86::VFNMADD231BF16Zr, X86::VFNMADD231BF16Zm, 0}, {X86::VFNMADD231PDYr, X86::VFNMADD231PDYm, 0}, {X86::VFNMADD231PDZ128r, X86::VFNMADD231PDZ128m, 0}, {X86::VFNMADD231PDZ256r, X86::VFNMADD231PDZ256m, 0}, @@ -4952,9 +4952,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFNMADDSD4rr_Int, X86::VFNMADDSD4rm_Int, TB_NO_REVERSE}, {X86::VFNMADDSS4rr, X86::VFNMADDSS4rm, 0}, {X86::VFNMADDSS4rr_Int, X86::VFNMADDSS4rm_Int, TB_NO_REVERSE}, - {X86::VFNMSUB132NEPBF16Z128r, X86::VFNMSUB132NEPBF16Z128m, 0}, - {X86::VFNMSUB132NEPBF16Z256r, X86::VFNMSUB132NEPBF16Z256m, 0}, - {X86::VFNMSUB132NEPBF16Zr, X86::VFNMSUB132NEPBF16Zm, 0}, + {X86::VFNMSUB132BF16Z128r, X86::VFNMSUB132BF16Z128m, 0}, + {X86::VFNMSUB132BF16Z256r, X86::VFNMSUB132BF16Z256m, 0}, + {X86::VFNMSUB132BF16Zr, X86::VFNMSUB132BF16Zm, 0}, {X86::VFNMSUB132PDYr, X86::VFNMSUB132PDYm, 0}, {X86::VFNMSUB132PDZ128r, X86::VFNMSUB132PDZ128m, 0}, {X86::VFNMSUB132PDZ256r, X86::VFNMSUB132PDZ256m, 0}, @@ -4978,9 +4978,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFNMSUB132SSZr_Int, X86::VFNMSUB132SSZm_Int, TB_NO_REVERSE}, {X86::VFNMSUB132SSr, X86::VFNMSUB132SSm, 0}, {X86::VFNMSUB132SSr_Int, X86::VFNMSUB132SSm_Int, TB_NO_REVERSE}, - {X86::VFNMSUB213NEPBF16Z128r, X86::VFNMSUB213NEPBF16Z128m, 0}, - {X86::VFNMSUB213NEPBF16Z256r, X86::VFNMSUB213NEPBF16Z256m, 0}, - {X86::VFNMSUB213NEPBF16Zr, X86::VFNMSUB213NEPBF16Zm, 0}, + {X86::VFNMSUB213BF16Z128r, X86::VFNMSUB213BF16Z128m, 0}, + 
{X86::VFNMSUB213BF16Z256r, X86::VFNMSUB213BF16Z256m, 0}, + {X86::VFNMSUB213BF16Zr, X86::VFNMSUB213BF16Zm, 0}, {X86::VFNMSUB213PDYr, X86::VFNMSUB213PDYm, 0}, {X86::VFNMSUB213PDZ128r, X86::VFNMSUB213PDZ128m, 0}, {X86::VFNMSUB213PDZ256r, X86::VFNMSUB213PDZ256m, 0}, @@ -5004,9 +5004,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFNMSUB213SSZr_Int, X86::VFNMSUB213SSZm_Int, TB_NO_REVERSE}, {X86::VFNMSUB213SSr, X86::VFNMSUB213SSm, 0}, {X86::VFNMSUB213SSr_Int, X86::VFNMSUB213SSm_Int, TB_NO_REVERSE}, - {X86::VFNMSUB231NEPBF16Z128r, X86::VFNMSUB231NEPBF16Z128m, 0}, - {X86::VFNMSUB231NEPBF16Z256r, X86::VFNMSUB231NEPBF16Z256m, 0}, - {X86::VFNMSUB231NEPBF16Zr, X86::VFNMSUB231NEPBF16Zm, 0}, + {X86::VFNMSUB231BF16Z128r, X86::VFNMSUB231BF16Z128m, 0}, + {X86::VFNMSUB231BF16Z256r, X86::VFNMSUB231BF16Z256m, 0}, + {X86::VFNMSUB231BF16Zr, X86::VFNMSUB231BF16Zm, 0}, {X86::VFNMSUB231PDYr, X86::VFNMSUB231PDYm, 0}, {X86::VFNMSUB231PDZ128r, X86::VFNMSUB231PDZ128m, 0}, {X86::VFNMSUB231PDZ256r, X86::VFNMSUB231PDZ256m, 0}, @@ -5038,9 +5038,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VFNMSUBSD4rr_Int, X86::VFNMSUBSD4rm_Int, TB_NO_REVERSE}, {X86::VFNMSUBSS4rr, X86::VFNMSUBSS4rm, 0}, {X86::VFNMSUBSS4rr_Int, X86::VFNMSUBSS4rm_Int, TB_NO_REVERSE}, - {X86::VGETEXPPBF16Z128rk, X86::VGETEXPPBF16Z128mk, 0}, - {X86::VGETEXPPBF16Z256rk, X86::VGETEXPPBF16Z256mk, 0}, - {X86::VGETEXPPBF16Zrk, X86::VGETEXPPBF16Zmk, 0}, + {X86::VGETEXPBF16Z128rk, X86::VGETEXPBF16Z128mk, 0}, + {X86::VGETEXPBF16Z256rk, X86::VGETEXPBF16Z256mk, 0}, + {X86::VGETEXPBF16Zrk, X86::VGETEXPBF16Zmk, 0}, {X86::VGETEXPPDZ128rk, X86::VGETEXPPDZ128mk, 0}, {X86::VGETEXPPDZ256rk, X86::VGETEXPPDZ256mk, 0}, {X86::VGETEXPPDZrk, X86::VGETEXPPDZmk, 0}, @@ -5053,9 +5053,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VGETEXPSDZrkz, X86::VGETEXPSDZmkz, TB_NO_REVERSE}, {X86::VGETEXPSHZrkz, X86::VGETEXPSHZmkz, TB_NO_REVERSE}, {X86::VGETEXPSSZrkz, X86::VGETEXPSSZmkz, TB_NO_REVERSE}, - {X86::VGETMANTPBF16Z128rrik, 
X86::VGETMANTPBF16Z128rmik, 0}, - {X86::VGETMANTPBF16Z256rrik, X86::VGETMANTPBF16Z256rmik, 0}, - {X86::VGETMANTPBF16Zrrik, X86::VGETMANTPBF16Zrmik, 0}, + {X86::VGETMANTBF16Z128rrik, X86::VGETMANTBF16Z128rmik, 0}, + {X86::VGETMANTBF16Z256rrik, X86::VGETMANTBF16Z256rmik, 0}, + {X86::VGETMANTBF16Zrrik, X86::VGETMANTBF16Zrmik, 0}, {X86::VGETMANTPDZ128rrik, X86::VGETMANTPDZ128rmik, 0}, {X86::VGETMANTPDZ256rrik, X86::VGETMANTPDZ256rmik, 0}, {X86::VGETMANTPDZrrik, X86::VGETMANTPDZrmik, 0}, @@ -5089,6 +5089,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VINSERTI64X2Z256rrikz, X86::VINSERTI64X2Z256rmikz, 0}, {X86::VINSERTI64X2Zrrikz, X86::VINSERTI64X2Zrmikz, 0}, {X86::VINSERTI64X4Zrrikz, X86::VINSERTI64X4Zrmikz, 0}, + {X86::VMAXBF16Z128rrkz, X86::VMAXBF16Z128rmkz, 0}, + {X86::VMAXBF16Z256rrkz, X86::VMAXBF16Z256rmkz, 0}, + {X86::VMAXBF16Zrrkz, X86::VMAXBF16Zrmkz, 0}, {X86::VMAXCPDZ128rrkz, X86::VMAXCPDZ128rmkz, 0}, {X86::VMAXCPDZ256rrkz, X86::VMAXCPDZ256rmkz, 0}, {X86::VMAXCPDZrrkz, X86::VMAXCPDZrmkz, 0}, @@ -5098,9 +5101,6 @@ static const X86FoldTableEntry Table3[] = { {X86::VMAXCPSZ128rrkz, X86::VMAXCPSZ128rmkz, 0}, {X86::VMAXCPSZ256rrkz, X86::VMAXCPSZ256rmkz, 0}, {X86::VMAXCPSZrrkz, X86::VMAXCPSZrmkz, 0}, - {X86::VMAXPBF16Z128rrkz, X86::VMAXPBF16Z128rmkz, 0}, - {X86::VMAXPBF16Z256rrkz, X86::VMAXPBF16Z256rmkz, 0}, - {X86::VMAXPBF16Zrrkz, X86::VMAXPBF16Zrmkz, 0}, {X86::VMAXPDZ128rrkz, X86::VMAXPDZ128rmkz, 0}, {X86::VMAXPDZ256rrkz, X86::VMAXPDZ256rmkz, 0}, {X86::VMAXPDZrrkz, X86::VMAXPDZrmkz, 0}, @@ -5113,6 +5113,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VMAXSDZrrkz_Int, X86::VMAXSDZrmkz_Int, TB_NO_REVERSE}, {X86::VMAXSHZrrkz_Int, X86::VMAXSHZrmkz_Int, TB_NO_REVERSE}, {X86::VMAXSSZrrkz_Int, X86::VMAXSSZrmkz_Int, TB_NO_REVERSE}, + {X86::VMINBF16Z128rrkz, X86::VMINBF16Z128rmkz, 0}, + {X86::VMINBF16Z256rrkz, X86::VMINBF16Z256rmkz, 0}, + {X86::VMINBF16Zrrkz, X86::VMINBF16Zrmkz, 0}, {X86::VMINCPDZ128rrkz, X86::VMINCPDZ128rmkz, 0}, {X86::VMINCPDZ256rrkz, 
X86::VMINCPDZ256rmkz, 0}, {X86::VMINCPDZrrkz, X86::VMINCPDZrmkz, 0}, @@ -5137,9 +5140,6 @@ static const X86FoldTableEntry Table3[] = { {X86::VMINMAXSDrrikz_Int, X86::VMINMAXSDrmikz_Int, TB_NO_REVERSE}, {X86::VMINMAXSHrrikz_Int, X86::VMINMAXSHrmikz_Int, TB_NO_REVERSE}, {X86::VMINMAXSSrrikz_Int, X86::VMINMAXSSrmikz_Int, TB_NO_REVERSE}, - {X86::VMINPBF16Z128rrkz, X86::VMINPBF16Z128rmkz, 0}, - {X86::VMINPBF16Z256rrkz, X86::VMINPBF16Z256rmkz, 0}, - {X86::VMINPBF16Zrrkz, X86::VMINPBF16Zrmkz, 0}, {X86::VMINPDZ128rrkz, X86::VMINPDZ128rmkz, 0}, {X86::VMINPDZ256rrkz, X86::VMINPDZ256rmkz, 0}, {X86::VMINPDZrrkz, X86::VMINPDZrmkz, 0}, @@ -5194,9 +5194,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VMPSADBWZ128rrikz, X86::VMPSADBWZ128rmikz, 0}, {X86::VMPSADBWZ256rrikz, X86::VMPSADBWZ256rmikz, 0}, {X86::VMPSADBWZrrikz, X86::VMPSADBWZrmikz, 0}, - {X86::VMULNEPBF16Z128rrkz, X86::VMULNEPBF16Z128rmkz, 0}, - {X86::VMULNEPBF16Z256rrkz, X86::VMULNEPBF16Z256rmkz, 0}, - {X86::VMULNEPBF16Zrrkz, X86::VMULNEPBF16Zrmkz, 0}, + {X86::VMULBF16Z128rrkz, X86::VMULBF16Z128rmkz, 0}, + {X86::VMULBF16Z256rrkz, X86::VMULBF16Z256rmkz, 0}, + {X86::VMULBF16Zrrkz, X86::VMULBF16Zrmkz, 0}, {X86::VMULPDZ128rrkz, X86::VMULPDZ128rmkz, 0}, {X86::VMULPDZ256rrkz, X86::VMULPDZ256rmkz, 0}, {X86::VMULPDZrrkz, X86::VMULPDZrmkz, 0}, @@ -5938,16 +5938,16 @@ static const X86FoldTableEntry Table3[] = { {X86::VRCP28PSZrk, X86::VRCP28PSZmk, 0}, {X86::VRCP28SDZrkz, X86::VRCP28SDZmkz, TB_NO_REVERSE}, {X86::VRCP28SSZrkz, X86::VRCP28SSZmkz, TB_NO_REVERSE}, - {X86::VRCPPBF16Z128rk, X86::VRCPPBF16Z128mk, 0}, - {X86::VRCPPBF16Z256rk, X86::VRCPPBF16Z256mk, 0}, - {X86::VRCPPBF16Zrk, X86::VRCPPBF16Zmk, 0}, + {X86::VRCPBF16Z128rk, X86::VRCPBF16Z128mk, 0}, + {X86::VRCPBF16Z256rk, X86::VRCPBF16Z256mk, 0}, + {X86::VRCPBF16Zrk, X86::VRCPBF16Zmk, 0}, {X86::VRCPPHZ128rk, X86::VRCPPHZ128mk, 0}, {X86::VRCPPHZ256rk, X86::VRCPPHZ256mk, 0}, {X86::VRCPPHZrk, X86::VRCPPHZmk, 0}, {X86::VRCPSHZrrkz, X86::VRCPSHZrmkz, TB_NO_REVERSE}, - 
{X86::VREDUCENEPBF16Z128rrik, X86::VREDUCENEPBF16Z128rmik, 0}, - {X86::VREDUCENEPBF16Z256rrik, X86::VREDUCENEPBF16Z256rmik, 0}, - {X86::VREDUCENEPBF16Zrrik, X86::VREDUCENEPBF16Zrmik, 0}, + {X86::VREDUCEBF16Z128rrik, X86::VREDUCEBF16Z128rmik, 0}, + {X86::VREDUCEBF16Z256rrik, X86::VREDUCEBF16Z256rmik, 0}, + {X86::VREDUCEBF16Zrrik, X86::VREDUCEBF16Zrmik, 0}, {X86::VREDUCEPDZ128rrik, X86::VREDUCEPDZ128rmik, 0}, {X86::VREDUCEPDZ256rrik, X86::VREDUCEPDZ256rmik, 0}, {X86::VREDUCEPDZrrik, X86::VREDUCEPDZrmik, 0}, @@ -5960,9 +5960,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VREDUCESDZrrikz, X86::VREDUCESDZrmikz, TB_NO_REVERSE}, {X86::VREDUCESHZrrikz, X86::VREDUCESHZrmikz, TB_NO_REVERSE}, {X86::VREDUCESSZrrikz, X86::VREDUCESSZrmikz, TB_NO_REVERSE}, - {X86::VRNDSCALENEPBF16Z128rrik, X86::VRNDSCALENEPBF16Z128rmik, 0}, - {X86::VRNDSCALENEPBF16Z256rrik, X86::VRNDSCALENEPBF16Z256rmik, 0}, - {X86::VRNDSCALENEPBF16Zrrik, X86::VRNDSCALENEPBF16Zrmik, 0}, + {X86::VRNDSCALEBF16Z128rrik, X86::VRNDSCALEBF16Z128rmik, 0}, + {X86::VRNDSCALEBF16Z256rrik, X86::VRNDSCALEBF16Z256rmik, 0}, + {X86::VRNDSCALEBF16Zrrik, X86::VRNDSCALEBF16Zrmik, 0}, {X86::VRNDSCALEPDZ128rrik, X86::VRNDSCALEPDZ128rmik, 0}, {X86::VRNDSCALEPDZ256rrik, X86::VRNDSCALEPDZ256rmik, 0}, {X86::VRNDSCALEPDZrrik, X86::VRNDSCALEPDZrmik, 0}, @@ -5987,16 +5987,16 @@ static const X86FoldTableEntry Table3[] = { {X86::VRSQRT28PSZrk, X86::VRSQRT28PSZmk, 0}, {X86::VRSQRT28SDZrkz, X86::VRSQRT28SDZmkz, TB_NO_REVERSE}, {X86::VRSQRT28SSZrkz, X86::VRSQRT28SSZmkz, TB_NO_REVERSE}, - {X86::VRSQRTPBF16Z128rk, X86::VRSQRTPBF16Z128mk, 0}, - {X86::VRSQRTPBF16Z256rk, X86::VRSQRTPBF16Z256mk, 0}, - {X86::VRSQRTPBF16Zrk, X86::VRSQRTPBF16Zmk, 0}, + {X86::VRSQRTBF16Z128rk, X86::VRSQRTBF16Z128mk, 0}, + {X86::VRSQRTBF16Z256rk, X86::VRSQRTBF16Z256mk, 0}, + {X86::VRSQRTBF16Zrk, X86::VRSQRTBF16Zmk, 0}, {X86::VRSQRTPHZ128rk, X86::VRSQRTPHZ128mk, 0}, {X86::VRSQRTPHZ256rk, X86::VRSQRTPHZ256mk, 0}, {X86::VRSQRTPHZrk, X86::VRSQRTPHZmk, 0}, 
{X86::VRSQRTSHZrrkz, X86::VRSQRTSHZrmkz, TB_NO_REVERSE}, - {X86::VSCALEFPBF16Z128rrkz, X86::VSCALEFPBF16Z128rmkz, 0}, - {X86::VSCALEFPBF16Z256rrkz, X86::VSCALEFPBF16Z256rmkz, 0}, - {X86::VSCALEFPBF16Zrrkz, X86::VSCALEFPBF16Zrmkz, 0}, + {X86::VSCALEFBF16Z128rrkz, X86::VSCALEFBF16Z128rmkz, 0}, + {X86::VSCALEFBF16Z256rrkz, X86::VSCALEFBF16Z256rmkz, 0}, + {X86::VSCALEFBF16Zrrkz, X86::VSCALEFBF16Zrmkz, 0}, {X86::VSCALEFPDZ128rrkz, X86::VSCALEFPDZ128rmkz, 0}, {X86::VSCALEFPDZ256rrkz, X86::VSCALEFPDZ256rmkz, 0}, {X86::VSCALEFPDZrrkz, X86::VSCALEFPDZrmkz, 0}, @@ -6026,9 +6026,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VSM3MSG1rr, X86::VSM3MSG1rm, 0}, {X86::VSM3MSG2rr, X86::VSM3MSG2rm, 0}, {X86::VSM3RNDS2rr, X86::VSM3RNDS2rm, 0}, - {X86::VSQRTNEPBF16Z128rk, X86::VSQRTNEPBF16Z128mk, 0}, - {X86::VSQRTNEPBF16Z256rk, X86::VSQRTNEPBF16Z256mk, 0}, - {X86::VSQRTNEPBF16Zrk, X86::VSQRTNEPBF16Zmk, 0}, + {X86::VSQRTBF16Z128rk, X86::VSQRTBF16Z128mk, 0}, + {X86::VSQRTBF16Z256rk, X86::VSQRTBF16Z256mk, 0}, + {X86::VSQRTBF16Zrk, X86::VSQRTBF16Zmk, 0}, {X86::VSQRTPDZ128rk, X86::VSQRTPDZ128mk, 0}, {X86::VSQRTPDZ256rk, X86::VSQRTPDZ256mk, 0}, {X86::VSQRTPDZrk, X86::VSQRTPDZmk, 0}, @@ -6041,9 +6041,9 @@ static const X86FoldTableEntry Table3[] = { {X86::VSQRTSDZrkz_Int, X86::VSQRTSDZmkz_Int, TB_NO_REVERSE}, {X86::VSQRTSHZrkz_Int, X86::VSQRTSHZmkz_Int, TB_NO_REVERSE}, {X86::VSQRTSSZrkz_Int, X86::VSQRTSSZmkz_Int, TB_NO_REVERSE}, - {X86::VSUBNEPBF16Z128rrkz, X86::VSUBNEPBF16Z128rmkz, 0}, - {X86::VSUBNEPBF16Z256rrkz, X86::VSUBNEPBF16Z256rmkz, 0}, - {X86::VSUBNEPBF16Zrrkz, X86::VSUBNEPBF16Zrmkz, 0}, + {X86::VSUBBF16Z128rrkz, X86::VSUBBF16Z128rmkz, 0}, + {X86::VSUBBF16Z256rrkz, X86::VSUBBF16Z256rmkz, 0}, + {X86::VSUBBF16Zrrkz, X86::VSUBBF16Zrmkz, 0}, {X86::VSUBPDZ128rrkz, X86::VSUBPDZ128rmkz, 0}, {X86::VSUBPDZ256rrkz, X86::VSUBPDZ256rmkz, 0}, {X86::VSUBPDZrrkz, X86::VSUBPDZrmkz, 0}, @@ -6077,9 +6077,9 @@ static const X86FoldTableEntry Table3[] = { }; static const X86FoldTableEntry 
Table4[] = { - {X86::VADDNEPBF16Z128rrk, X86::VADDNEPBF16Z128rmk, 0}, - {X86::VADDNEPBF16Z256rrk, X86::VADDNEPBF16Z256rmk, 0}, - {X86::VADDNEPBF16Zrrk, X86::VADDNEPBF16Zrmk, 0}, + {X86::VADDBF16Z128rrk, X86::VADDBF16Z128rmk, 0}, + {X86::VADDBF16Z256rrk, X86::VADDBF16Z256rmk, 0}, + {X86::VADDBF16Zrrk, X86::VADDBF16Zrmk, 0}, {X86::VADDPDZ128rrk, X86::VADDPDZ128rmk, 0}, {X86::VADDPDZ256rrk, X86::VADDPDZ256rmk, 0}, {X86::VADDPDZrrk, X86::VADDPDZrmk, 0}, @@ -6149,9 +6149,9 @@ static const X86FoldTableEntry Table4[] = { {X86::VDBPSADBWZ128rrik, X86::VDBPSADBWZ128rmik, 0}, {X86::VDBPSADBWZ256rrik, X86::VDBPSADBWZ256rmik, 0}, {X86::VDBPSADBWZrrik, X86::VDBPSADBWZrmik, 0}, - {X86::VDIVNEPBF16Z128rrk, X86::VDIVNEPBF16Z128rmk, 0}, - {X86::VDIVNEPBF16Z256rrk, X86::VDIVNEPBF16Z256rmk, 0}, - {X86::VDIVNEPBF16Zrrk, X86::VDIVNEPBF16Zrmk, 0}, + {X86::VDIVBF16Z128rrk, X86::VDIVBF16Z128rmk, 0}, + {X86::VDIVBF16Z256rrk, X86::VDIVBF16Z256rmk, 0}, + {X86::VDIVBF16Zrrk, X86::VDIVBF16Zrmk, 0}, {X86::VDIVPDZ128rrk, X86::VDIVPDZ128rmk, 0}, {X86::VDIVPDZ256rrk, X86::VDIVPDZ256rmk, 0}, {X86::VDIVPDZrrk, X86::VDIVPDZrmk, 0}, @@ -6204,12 +6204,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFIXUPIMMSDZrrikz, X86::VFIXUPIMMSDZrmikz, TB_NO_REVERSE}, {X86::VFIXUPIMMSSZrrik, X86::VFIXUPIMMSSZrmik, TB_NO_REVERSE}, {X86::VFIXUPIMMSSZrrikz, X86::VFIXUPIMMSSZrmikz, TB_NO_REVERSE}, - {X86::VFMADD132NEPBF16Z128rk, X86::VFMADD132NEPBF16Z128mk, 0}, - {X86::VFMADD132NEPBF16Z128rkz, X86::VFMADD132NEPBF16Z128mkz, 0}, - {X86::VFMADD132NEPBF16Z256rk, X86::VFMADD132NEPBF16Z256mk, 0}, - {X86::VFMADD132NEPBF16Z256rkz, X86::VFMADD132NEPBF16Z256mkz, 0}, - {X86::VFMADD132NEPBF16Zrk, X86::VFMADD132NEPBF16Zmk, 0}, - {X86::VFMADD132NEPBF16Zrkz, X86::VFMADD132NEPBF16Zmkz, 0}, + {X86::VFMADD132BF16Z128rk, X86::VFMADD132BF16Z128mk, 0}, + {X86::VFMADD132BF16Z128rkz, X86::VFMADD132BF16Z128mkz, 0}, + {X86::VFMADD132BF16Z256rk, X86::VFMADD132BF16Z256mk, 0}, + {X86::VFMADD132BF16Z256rkz, X86::VFMADD132BF16Z256mkz, 0}, 
+ {X86::VFMADD132BF16Zrk, X86::VFMADD132BF16Zmk, 0}, + {X86::VFMADD132BF16Zrkz, X86::VFMADD132BF16Zmkz, 0}, {X86::VFMADD132PDZ128rk, X86::VFMADD132PDZ128mk, 0}, {X86::VFMADD132PDZ128rkz, X86::VFMADD132PDZ128mkz, 0}, {X86::VFMADD132PDZ256rk, X86::VFMADD132PDZ256mk, 0}, @@ -6234,12 +6234,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFMADD132SHZrkz_Int, X86::VFMADD132SHZmkz_Int, TB_NO_REVERSE}, {X86::VFMADD132SSZrk_Int, X86::VFMADD132SSZmk_Int, TB_NO_REVERSE}, {X86::VFMADD132SSZrkz_Int, X86::VFMADD132SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFMADD213NEPBF16Z128rk, X86::VFMADD213NEPBF16Z128mk, 0}, - {X86::VFMADD213NEPBF16Z128rkz, X86::VFMADD213NEPBF16Z128mkz, 0}, - {X86::VFMADD213NEPBF16Z256rk, X86::VFMADD213NEPBF16Z256mk, 0}, - {X86::VFMADD213NEPBF16Z256rkz, X86::VFMADD213NEPBF16Z256mkz, 0}, - {X86::VFMADD213NEPBF16Zrk, X86::VFMADD213NEPBF16Zmk, 0}, - {X86::VFMADD213NEPBF16Zrkz, X86::VFMADD213NEPBF16Zmkz, 0}, + {X86::VFMADD213BF16Z128rk, X86::VFMADD213BF16Z128mk, 0}, + {X86::VFMADD213BF16Z128rkz, X86::VFMADD213BF16Z128mkz, 0}, + {X86::VFMADD213BF16Z256rk, X86::VFMADD213BF16Z256mk, 0}, + {X86::VFMADD213BF16Z256rkz, X86::VFMADD213BF16Z256mkz, 0}, + {X86::VFMADD213BF16Zrk, X86::VFMADD213BF16Zmk, 0}, + {X86::VFMADD213BF16Zrkz, X86::VFMADD213BF16Zmkz, 0}, {X86::VFMADD213PDZ128rk, X86::VFMADD213PDZ128mk, 0}, {X86::VFMADD213PDZ128rkz, X86::VFMADD213PDZ128mkz, 0}, {X86::VFMADD213PDZ256rk, X86::VFMADD213PDZ256mk, 0}, @@ -6264,12 +6264,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFMADD213SHZrkz_Int, X86::VFMADD213SHZmkz_Int, TB_NO_REVERSE}, {X86::VFMADD213SSZrk_Int, X86::VFMADD213SSZmk_Int, TB_NO_REVERSE}, {X86::VFMADD213SSZrkz_Int, X86::VFMADD213SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFMADD231NEPBF16Z128rk, X86::VFMADD231NEPBF16Z128mk, 0}, - {X86::VFMADD231NEPBF16Z128rkz, X86::VFMADD231NEPBF16Z128mkz, 0}, - {X86::VFMADD231NEPBF16Z256rk, X86::VFMADD231NEPBF16Z256mk, 0}, - {X86::VFMADD231NEPBF16Z256rkz, X86::VFMADD231NEPBF16Z256mkz, 0}, - 
{X86::VFMADD231NEPBF16Zrk, X86::VFMADD231NEPBF16Zmk, 0}, - {X86::VFMADD231NEPBF16Zrkz, X86::VFMADD231NEPBF16Zmkz, 0}, + {X86::VFMADD231BF16Z128rk, X86::VFMADD231BF16Z128mk, 0}, + {X86::VFMADD231BF16Z128rkz, X86::VFMADD231BF16Z128mkz, 0}, + {X86::VFMADD231BF16Z256rk, X86::VFMADD231BF16Z256mk, 0}, + {X86::VFMADD231BF16Z256rkz, X86::VFMADD231BF16Z256mkz, 0}, + {X86::VFMADD231BF16Zrk, X86::VFMADD231BF16Zmk, 0}, + {X86::VFMADD231BF16Zrkz, X86::VFMADD231BF16Zmkz, 0}, {X86::VFMADD231PDZ128rk, X86::VFMADD231PDZ128mk, 0}, {X86::VFMADD231PDZ128rkz, X86::VFMADD231PDZ128mkz, 0}, {X86::VFMADD231PDZ256rk, X86::VFMADD231PDZ256mk, 0}, @@ -6356,12 +6356,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFMADDSUB231PSZ256rkz, X86::VFMADDSUB231PSZ256mkz, 0}, {X86::VFMADDSUB231PSZrk, X86::VFMADDSUB231PSZmk, 0}, {X86::VFMADDSUB231PSZrkz, X86::VFMADDSUB231PSZmkz, 0}, - {X86::VFMSUB132NEPBF16Z128rk, X86::VFMSUB132NEPBF16Z128mk, 0}, - {X86::VFMSUB132NEPBF16Z128rkz, X86::VFMSUB132NEPBF16Z128mkz, 0}, - {X86::VFMSUB132NEPBF16Z256rk, X86::VFMSUB132NEPBF16Z256mk, 0}, - {X86::VFMSUB132NEPBF16Z256rkz, X86::VFMSUB132NEPBF16Z256mkz, 0}, - {X86::VFMSUB132NEPBF16Zrk, X86::VFMSUB132NEPBF16Zmk, 0}, - {X86::VFMSUB132NEPBF16Zrkz, X86::VFMSUB132NEPBF16Zmkz, 0}, + {X86::VFMSUB132BF16Z128rk, X86::VFMSUB132BF16Z128mk, 0}, + {X86::VFMSUB132BF16Z128rkz, X86::VFMSUB132BF16Z128mkz, 0}, + {X86::VFMSUB132BF16Z256rk, X86::VFMSUB132BF16Z256mk, 0}, + {X86::VFMSUB132BF16Z256rkz, X86::VFMSUB132BF16Z256mkz, 0}, + {X86::VFMSUB132BF16Zrk, X86::VFMSUB132BF16Zmk, 0}, + {X86::VFMSUB132BF16Zrkz, X86::VFMSUB132BF16Zmkz, 0}, {X86::VFMSUB132PDZ128rk, X86::VFMSUB132PDZ128mk, 0}, {X86::VFMSUB132PDZ128rkz, X86::VFMSUB132PDZ128mkz, 0}, {X86::VFMSUB132PDZ256rk, X86::VFMSUB132PDZ256mk, 0}, @@ -6386,12 +6386,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFMSUB132SHZrkz_Int, X86::VFMSUB132SHZmkz_Int, TB_NO_REVERSE}, {X86::VFMSUB132SSZrk_Int, X86::VFMSUB132SSZmk_Int, TB_NO_REVERSE}, {X86::VFMSUB132SSZrkz_Int, 
X86::VFMSUB132SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFMSUB213NEPBF16Z128rk, X86::VFMSUB213NEPBF16Z128mk, 0}, - {X86::VFMSUB213NEPBF16Z128rkz, X86::VFMSUB213NEPBF16Z128mkz, 0}, - {X86::VFMSUB213NEPBF16Z256rk, X86::VFMSUB213NEPBF16Z256mk, 0}, - {X86::VFMSUB213NEPBF16Z256rkz, X86::VFMSUB213NEPBF16Z256mkz, 0}, - {X86::VFMSUB213NEPBF16Zrk, X86::VFMSUB213NEPBF16Zmk, 0}, - {X86::VFMSUB213NEPBF16Zrkz, X86::VFMSUB213NEPBF16Zmkz, 0}, + {X86::VFMSUB213BF16Z128rk, X86::VFMSUB213BF16Z128mk, 0}, + {X86::VFMSUB213BF16Z128rkz, X86::VFMSUB213BF16Z128mkz, 0}, + {X86::VFMSUB213BF16Z256rk, X86::VFMSUB213BF16Z256mk, 0}, + {X86::VFMSUB213BF16Z256rkz, X86::VFMSUB213BF16Z256mkz, 0}, + {X86::VFMSUB213BF16Zrk, X86::VFMSUB213BF16Zmk, 0}, + {X86::VFMSUB213BF16Zrkz, X86::VFMSUB213BF16Zmkz, 0}, {X86::VFMSUB213PDZ128rk, X86::VFMSUB213PDZ128mk, 0}, {X86::VFMSUB213PDZ128rkz, X86::VFMSUB213PDZ128mkz, 0}, {X86::VFMSUB213PDZ256rk, X86::VFMSUB213PDZ256mk, 0}, @@ -6416,12 +6416,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFMSUB213SHZrkz_Int, X86::VFMSUB213SHZmkz_Int, TB_NO_REVERSE}, {X86::VFMSUB213SSZrk_Int, X86::VFMSUB213SSZmk_Int, TB_NO_REVERSE}, {X86::VFMSUB213SSZrkz_Int, X86::VFMSUB213SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFMSUB231NEPBF16Z128rk, X86::VFMSUB231NEPBF16Z128mk, 0}, - {X86::VFMSUB231NEPBF16Z128rkz, X86::VFMSUB231NEPBF16Z128mkz, 0}, - {X86::VFMSUB231NEPBF16Z256rk, X86::VFMSUB231NEPBF16Z256mk, 0}, - {X86::VFMSUB231NEPBF16Z256rkz, X86::VFMSUB231NEPBF16Z256mkz, 0}, - {X86::VFMSUB231NEPBF16Zrk, X86::VFMSUB231NEPBF16Zmk, 0}, - {X86::VFMSUB231NEPBF16Zrkz, X86::VFMSUB231NEPBF16Zmkz, 0}, + {X86::VFMSUB231BF16Z128rk, X86::VFMSUB231BF16Z128mk, 0}, + {X86::VFMSUB231BF16Z128rkz, X86::VFMSUB231BF16Z128mkz, 0}, + {X86::VFMSUB231BF16Z256rk, X86::VFMSUB231BF16Z256mk, 0}, + {X86::VFMSUB231BF16Z256rkz, X86::VFMSUB231BF16Z256mkz, 0}, + {X86::VFMSUB231BF16Zrk, X86::VFMSUB231BF16Zmk, 0}, + {X86::VFMSUB231BF16Zrkz, X86::VFMSUB231BF16Zmkz, 0}, {X86::VFMSUB231PDZ128rk, X86::VFMSUB231PDZ128mk, 0}, 
{X86::VFMSUB231PDZ128rkz, X86::VFMSUB231PDZ128mkz, 0}, {X86::VFMSUB231PDZ256rk, X86::VFMSUB231PDZ256mk, 0}, @@ -6504,12 +6504,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFMULCPHZ256rrk, X86::VFMULCPHZ256rmk, 0}, {X86::VFMULCPHZrrk, X86::VFMULCPHZrmk, 0}, {X86::VFMULCSHZrrk, X86::VFMULCSHZrmk, TB_NO_REVERSE}, - {X86::VFNMADD132NEPBF16Z128rk, X86::VFNMADD132NEPBF16Z128mk, 0}, - {X86::VFNMADD132NEPBF16Z128rkz, X86::VFNMADD132NEPBF16Z128mkz, 0}, - {X86::VFNMADD132NEPBF16Z256rk, X86::VFNMADD132NEPBF16Z256mk, 0}, - {X86::VFNMADD132NEPBF16Z256rkz, X86::VFNMADD132NEPBF16Z256mkz, 0}, - {X86::VFNMADD132NEPBF16Zrk, X86::VFNMADD132NEPBF16Zmk, 0}, - {X86::VFNMADD132NEPBF16Zrkz, X86::VFNMADD132NEPBF16Zmkz, 0}, + {X86::VFNMADD132BF16Z128rk, X86::VFNMADD132BF16Z128mk, 0}, + {X86::VFNMADD132BF16Z128rkz, X86::VFNMADD132BF16Z128mkz, 0}, + {X86::VFNMADD132BF16Z256rk, X86::VFNMADD132BF16Z256mk, 0}, + {X86::VFNMADD132BF16Z256rkz, X86::VFNMADD132BF16Z256mkz, 0}, + {X86::VFNMADD132BF16Zrk, X86::VFNMADD132BF16Zmk, 0}, + {X86::VFNMADD132BF16Zrkz, X86::VFNMADD132BF16Zmkz, 0}, {X86::VFNMADD132PDZ128rk, X86::VFNMADD132PDZ128mk, 0}, {X86::VFNMADD132PDZ128rkz, X86::VFNMADD132PDZ128mkz, 0}, {X86::VFNMADD132PDZ256rk, X86::VFNMADD132PDZ256mk, 0}, @@ -6534,12 +6534,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFNMADD132SHZrkz_Int, X86::VFNMADD132SHZmkz_Int, TB_NO_REVERSE}, {X86::VFNMADD132SSZrk_Int, X86::VFNMADD132SSZmk_Int, TB_NO_REVERSE}, {X86::VFNMADD132SSZrkz_Int, X86::VFNMADD132SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFNMADD213NEPBF16Z128rk, X86::VFNMADD213NEPBF16Z128mk, 0}, - {X86::VFNMADD213NEPBF16Z128rkz, X86::VFNMADD213NEPBF16Z128mkz, 0}, - {X86::VFNMADD213NEPBF16Z256rk, X86::VFNMADD213NEPBF16Z256mk, 0}, - {X86::VFNMADD213NEPBF16Z256rkz, X86::VFNMADD213NEPBF16Z256mkz, 0}, - {X86::VFNMADD213NEPBF16Zrk, X86::VFNMADD213NEPBF16Zmk, 0}, - {X86::VFNMADD213NEPBF16Zrkz, X86::VFNMADD213NEPBF16Zmkz, 0}, + {X86::VFNMADD213BF16Z128rk, X86::VFNMADD213BF16Z128mk, 0}, + 
{X86::VFNMADD213BF16Z128rkz, X86::VFNMADD213BF16Z128mkz, 0}, + {X86::VFNMADD213BF16Z256rk, X86::VFNMADD213BF16Z256mk, 0}, + {X86::VFNMADD213BF16Z256rkz, X86::VFNMADD213BF16Z256mkz, 0}, + {X86::VFNMADD213BF16Zrk, X86::VFNMADD213BF16Zmk, 0}, + {X86::VFNMADD213BF16Zrkz, X86::VFNMADD213BF16Zmkz, 0}, {X86::VFNMADD213PDZ128rk, X86::VFNMADD213PDZ128mk, 0}, {X86::VFNMADD213PDZ128rkz, X86::VFNMADD213PDZ128mkz, 0}, {X86::VFNMADD213PDZ256rk, X86::VFNMADD213PDZ256mk, 0}, @@ -6564,12 +6564,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFNMADD213SHZrkz_Int, X86::VFNMADD213SHZmkz_Int, TB_NO_REVERSE}, {X86::VFNMADD213SSZrk_Int, X86::VFNMADD213SSZmk_Int, TB_NO_REVERSE}, {X86::VFNMADD213SSZrkz_Int, X86::VFNMADD213SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFNMADD231NEPBF16Z128rk, X86::VFNMADD231NEPBF16Z128mk, 0}, - {X86::VFNMADD231NEPBF16Z128rkz, X86::VFNMADD231NEPBF16Z128mkz, 0}, - {X86::VFNMADD231NEPBF16Z256rk, X86::VFNMADD231NEPBF16Z256mk, 0}, - {X86::VFNMADD231NEPBF16Z256rkz, X86::VFNMADD231NEPBF16Z256mkz, 0}, - {X86::VFNMADD231NEPBF16Zrk, X86::VFNMADD231NEPBF16Zmk, 0}, - {X86::VFNMADD231NEPBF16Zrkz, X86::VFNMADD231NEPBF16Zmkz, 0}, + {X86::VFNMADD231BF16Z128rk, X86::VFNMADD231BF16Z128mk, 0}, + {X86::VFNMADD231BF16Z128rkz, X86::VFNMADD231BF16Z128mkz, 0}, + {X86::VFNMADD231BF16Z256rk, X86::VFNMADD231BF16Z256mk, 0}, + {X86::VFNMADD231BF16Z256rkz, X86::VFNMADD231BF16Z256mkz, 0}, + {X86::VFNMADD231BF16Zrk, X86::VFNMADD231BF16Zmk, 0}, + {X86::VFNMADD231BF16Zrkz, X86::VFNMADD231BF16Zmkz, 0}, {X86::VFNMADD231PDZ128rk, X86::VFNMADD231PDZ128mk, 0}, {X86::VFNMADD231PDZ128rkz, X86::VFNMADD231PDZ128mkz, 0}, {X86::VFNMADD231PDZ256rk, X86::VFNMADD231PDZ256mk, 0}, @@ -6594,12 +6594,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFNMADD231SHZrkz_Int, X86::VFNMADD231SHZmkz_Int, TB_NO_REVERSE}, {X86::VFNMADD231SSZrk_Int, X86::VFNMADD231SSZmk_Int, TB_NO_REVERSE}, {X86::VFNMADD231SSZrkz_Int, X86::VFNMADD231SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFNMSUB132NEPBF16Z128rk, 
X86::VFNMSUB132NEPBF16Z128mk, 0}, - {X86::VFNMSUB132NEPBF16Z128rkz, X86::VFNMSUB132NEPBF16Z128mkz, 0}, - {X86::VFNMSUB132NEPBF16Z256rk, X86::VFNMSUB132NEPBF16Z256mk, 0}, - {X86::VFNMSUB132NEPBF16Z256rkz, X86::VFNMSUB132NEPBF16Z256mkz, 0}, - {X86::VFNMSUB132NEPBF16Zrk, X86::VFNMSUB132NEPBF16Zmk, 0}, - {X86::VFNMSUB132NEPBF16Zrkz, X86::VFNMSUB132NEPBF16Zmkz, 0}, + {X86::VFNMSUB132BF16Z128rk, X86::VFNMSUB132BF16Z128mk, 0}, + {X86::VFNMSUB132BF16Z128rkz, X86::VFNMSUB132BF16Z128mkz, 0}, + {X86::VFNMSUB132BF16Z256rk, X86::VFNMSUB132BF16Z256mk, 0}, + {X86::VFNMSUB132BF16Z256rkz, X86::VFNMSUB132BF16Z256mkz, 0}, + {X86::VFNMSUB132BF16Zrk, X86::VFNMSUB132BF16Zmk, 0}, + {X86::VFNMSUB132BF16Zrkz, X86::VFNMSUB132BF16Zmkz, 0}, {X86::VFNMSUB132PDZ128rk, X86::VFNMSUB132PDZ128mk, 0}, {X86::VFNMSUB132PDZ128rkz, X86::VFNMSUB132PDZ128mkz, 0}, {X86::VFNMSUB132PDZ256rk, X86::VFNMSUB132PDZ256mk, 0}, @@ -6624,12 +6624,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFNMSUB132SHZrkz_Int, X86::VFNMSUB132SHZmkz_Int, TB_NO_REVERSE}, {X86::VFNMSUB132SSZrk_Int, X86::VFNMSUB132SSZmk_Int, TB_NO_REVERSE}, {X86::VFNMSUB132SSZrkz_Int, X86::VFNMSUB132SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFNMSUB213NEPBF16Z128rk, X86::VFNMSUB213NEPBF16Z128mk, 0}, - {X86::VFNMSUB213NEPBF16Z128rkz, X86::VFNMSUB213NEPBF16Z128mkz, 0}, - {X86::VFNMSUB213NEPBF16Z256rk, X86::VFNMSUB213NEPBF16Z256mk, 0}, - {X86::VFNMSUB213NEPBF16Z256rkz, X86::VFNMSUB213NEPBF16Z256mkz, 0}, - {X86::VFNMSUB213NEPBF16Zrk, X86::VFNMSUB213NEPBF16Zmk, 0}, - {X86::VFNMSUB213NEPBF16Zrkz, X86::VFNMSUB213NEPBF16Zmkz, 0}, + {X86::VFNMSUB213BF16Z128rk, X86::VFNMSUB213BF16Z128mk, 0}, + {X86::VFNMSUB213BF16Z128rkz, X86::VFNMSUB213BF16Z128mkz, 0}, + {X86::VFNMSUB213BF16Z256rk, X86::VFNMSUB213BF16Z256mk, 0}, + {X86::VFNMSUB213BF16Z256rkz, X86::VFNMSUB213BF16Z256mkz, 0}, + {X86::VFNMSUB213BF16Zrk, X86::VFNMSUB213BF16Zmk, 0}, + {X86::VFNMSUB213BF16Zrkz, X86::VFNMSUB213BF16Zmkz, 0}, {X86::VFNMSUB213PDZ128rk, X86::VFNMSUB213PDZ128mk, 0}, 
{X86::VFNMSUB213PDZ128rkz, X86::VFNMSUB213PDZ128mkz, 0}, {X86::VFNMSUB213PDZ256rk, X86::VFNMSUB213PDZ256mk, 0}, @@ -6654,12 +6654,12 @@ static const X86FoldTableEntry Table4[] = { {X86::VFNMSUB213SHZrkz_Int, X86::VFNMSUB213SHZmkz_Int, TB_NO_REVERSE}, {X86::VFNMSUB213SSZrk_Int, X86::VFNMSUB213SSZmk_Int, TB_NO_REVERSE}, {X86::VFNMSUB213SSZrkz_Int, X86::VFNMSUB213SSZmkz_Int, TB_NO_REVERSE}, - {X86::VFNMSUB231NEPBF16Z128rk, X86::VFNMSUB231NEPBF16Z128mk, 0}, - {X86::VFNMSUB231NEPBF16Z128rkz, X86::VFNMSUB231NEPBF16Z128mkz, 0}, - {X86::VFNMSUB231NEPBF16Z256rk, X86::VFNMSUB231NEPBF16Z256mk, 0}, - {X86::VFNMSUB231NEPBF16Z256rkz, X86::VFNMSUB231NEPBF16Z256mkz, 0}, - {X86::VFNMSUB231NEPBF16Zrk, X86::VFNMSUB231NEPBF16Zmk, 0}, - {X86::VFNMSUB231NEPBF16Zrkz, X86::VFNMSUB231NEPBF16Zmkz, 0}, + {X86::VFNMSUB231BF16Z128rk, X86::VFNMSUB231BF16Z128mk, 0}, + {X86::VFNMSUB231BF16Z128rkz, X86::VFNMSUB231BF16Z128mkz, 0}, + {X86::VFNMSUB231BF16Z256rk, X86::VFNMSUB231BF16Z256mk, 0}, + {X86::VFNMSUB231BF16Z256rkz, X86::VFNMSUB231BF16Z256mkz, 0}, + {X86::VFNMSUB231BF16Zrk, X86::VFNMSUB231BF16Zmk, 0}, + {X86::VFNMSUB231BF16Zrkz, X86::VFNMSUB231BF16Zmkz, 0}, {X86::VFNMSUB231PDZ128rk, X86::VFNMSUB231PDZ128mk, 0}, {X86::VFNMSUB231PDZ128rkz, X86::VFNMSUB231PDZ128mkz, 0}, {X86::VFNMSUB231PDZ256rk, X86::VFNMSUB231PDZ256mk, 0}, @@ -6711,6 +6711,9 @@ static const X86FoldTableEntry Table4[] = { {X86::VINSERTI64X2Z256rrik, X86::VINSERTI64X2Z256rmik, 0}, {X86::VINSERTI64X2Zrrik, X86::VINSERTI64X2Zrmik, 0}, {X86::VINSERTI64X4Zrrik, X86::VINSERTI64X4Zrmik, 0}, + {X86::VMAXBF16Z128rrk, X86::VMAXBF16Z128rmk, 0}, + {X86::VMAXBF16Z256rrk, X86::VMAXBF16Z256rmk, 0}, + {X86::VMAXBF16Zrrk, X86::VMAXBF16Zrmk, 0}, {X86::VMAXCPDZ128rrk, X86::VMAXCPDZ128rmk, 0}, {X86::VMAXCPDZ256rrk, X86::VMAXCPDZ256rmk, 0}, {X86::VMAXCPDZrrk, X86::VMAXCPDZrmk, 0}, @@ -6720,9 +6723,6 @@ static const X86FoldTableEntry Table4[] = { {X86::VMAXCPSZ128rrk, X86::VMAXCPSZ128rmk, 0}, {X86::VMAXCPSZ256rrk, X86::VMAXCPSZ256rmk, 0}, 
{X86::VMAXCPSZrrk, X86::VMAXCPSZrmk, 0}, - {X86::VMAXPBF16Z128rrk, X86::VMAXPBF16Z128rmk, 0}, - {X86::VMAXPBF16Z256rrk, X86::VMAXPBF16Z256rmk, 0}, - {X86::VMAXPBF16Zrrk, X86::VMAXPBF16Zrmk, 0}, {X86::VMAXPDZ128rrk, X86::VMAXPDZ128rmk, 0}, {X86::VMAXPDZ256rrk, X86::VMAXPDZ256rmk, 0}, {X86::VMAXPDZrrk, X86::VMAXPDZrmk, 0}, @@ -6735,6 +6735,9 @@ static const X86FoldTableEntry Table4[] = { {X86::VMAXSDZrrk_Int, X86::VMAXSDZrmk_Int, TB_NO_REVERSE}, {X86::VMAXSHZrrk_Int, X86::VMAXSHZrmk_Int, TB_NO_REVERSE}, {X86::VMAXSSZrrk_Int, X86::VMAXSSZrmk_Int, TB_NO_REVERSE}, + {X86::VMINBF16Z128rrk, X86::VMINBF16Z128rmk, 0}, + {X86::VMINBF16Z256rrk, X86::VMINBF16Z256rmk, 0}, + {X86::VMINBF16Zrrk, X86::VMINBF16Zrmk, 0}, {X86::VMINCPDZ128rrk, X86::VMINCPDZ128rmk, 0}, {X86::VMINCPDZ256rrk, X86::VMINCPDZ256rmk, 0}, {X86::VMINCPDZrrk, X86::VMINCPDZrmk, 0}, @@ -6759,9 +6762,6 @@ static const X86FoldTableEntry Table4[] = { {X86::VMINMAXSDrrik_Int, X86::VMINMAXSDrmik_Int, TB_NO_REVERSE}, {X86::VMINMAXSHrrik_Int, X86::VMINMAXSHrmik_Int, TB_NO_REVERSE}, {X86::VMINMAXSSrrik_Int, X86::VMINMAXSSrmik_Int, TB_NO_REVERSE}, - {X86::VMINPBF16Z128rrk, X86::VMINPBF16Z128rmk, 0}, - {X86::VMINPBF16Z256rrk, X86::VMINPBF16Z256rmk, 0}, - {X86::VMINPBF16Zrrk, X86::VMINPBF16Zrmk, 0}, {X86::VMINPDZ128rrk, X86::VMINPDZ128rmk, 0}, {X86::VMINPDZ256rrk, X86::VMINPDZ256rmk, 0}, {X86::VMINPDZrrk, X86::VMINPDZrmk, 0}, @@ -6777,9 +6777,9 @@ static const X86FoldTableEntry Table4[] = { {X86::VMPSADBWZ128rrik, X86::VMPSADBWZ128rmik, 0}, {X86::VMPSADBWZ256rrik, X86::VMPSADBWZ256rmik, 0}, {X86::VMPSADBWZrrik, X86::VMPSADBWZrmik, 0}, - {X86::VMULNEPBF16Z128rrk, X86::VMULNEPBF16Z128rmk, 0}, - {X86::VMULNEPBF16Z256rrk, X86::VMULNEPBF16Z256rmk, 0}, - {X86::VMULNEPBF16Zrrk, X86::VMULNEPBF16Zrmk, 0}, + {X86::VMULBF16Z128rrk, X86::VMULBF16Z128rmk, 0}, + {X86::VMULBF16Z256rrk, X86::VMULBF16Z256rmk, 0}, + {X86::VMULBF16Zrrk, X86::VMULBF16Zrmk, 0}, {X86::VMULPDZ128rrk, X86::VMULPDZ128rmk, 0}, {X86::VMULPDZ256rrk, 
X86::VMULPDZ256rmk, 0}, {X86::VMULPDZrrk, X86::VMULPDZrmk, 0}, @@ -7355,9 +7355,9 @@ static const X86FoldTableEntry Table4[] = { {X86::VRSQRT28SDZrk, X86::VRSQRT28SDZmk, TB_NO_REVERSE}, {X86::VRSQRT28SSZrk, X86::VRSQRT28SSZmk, TB_NO_REVERSE}, {X86::VRSQRTSHZrrk, X86::VRSQRTSHZrmk, TB_NO_REVERSE}, - {X86::VSCALEFPBF16Z128rrk, X86::VSCALEFPBF16Z128rmk, 0}, - {X86::VSCALEFPBF16Z256rrk, X86::VSCALEFPBF16Z256rmk, 0}, - {X86::VSCALEFPBF16Zrrk, X86::VSCALEFPBF16Zrmk, 0}, + {X86::VSCALEFBF16Z128rrk, X86::VSCALEFBF16Z128rmk, 0}, + {X86::VSCALEFBF16Z256rrk, X86::VSCALEFBF16Z256rmk, 0}, + {X86::VSCALEFBF16Zrrk, X86::VSCALEFBF16Zrmk, 0}, {X86::VSCALEFPDZ128rrk, X86::VSCALEFPDZ128rmk, 0}, {X86::VSCALEFPDZ256rrk, X86::VSCALEFPDZ256rmk, 0}, {X86::VSCALEFPDZrrk, X86::VSCALEFPDZrmk, 0}, @@ -7387,9 +7387,9 @@ static const X86FoldTableEntry Table4[] = { {X86::VSQRTSDZrk_Int, X86::VSQRTSDZmk_Int, TB_NO_REVERSE}, {X86::VSQRTSHZrk_Int, X86::VSQRTSHZmk_Int, TB_NO_REVERSE}, {X86::VSQRTSSZrk_Int, X86::VSQRTSSZmk_Int, TB_NO_REVERSE}, - {X86::VSUBNEPBF16Z128rrk, X86::VSUBNEPBF16Z128rmk, 0}, - {X86::VSUBNEPBF16Z256rrk, X86::VSUBNEPBF16Z256rmk, 0}, - {X86::VSUBNEPBF16Zrrk, X86::VSUBNEPBF16Zrmk, 0}, + {X86::VSUBBF16Z128rrk, X86::VSUBBF16Z128rmk, 0}, + {X86::VSUBBF16Z256rrk, X86::VSUBBF16Z256rmk, 0}, + {X86::VSUBBF16Zrrk, X86::VSUBBF16Zrmk, 0}, {X86::VSUBPDZ128rrk, X86::VSUBPDZ128rmk, 0}, {X86::VSUBPDZ256rrk, X86::VSUBPDZ256rmk, 0}, {X86::VSUBPDZrrk, X86::VSUBPDZrmk, 0}, @@ -7644,9 +7644,9 @@ static const X86FoldTableEntry BroadcastTable1[] = { {X86::VCVTW2PHZrr, X86::VCVTW2PHZrmb, TB_BCAST_W}, {X86::VEXP2PDZr, X86::VEXP2PDZmb, TB_BCAST_SD}, {X86::VEXP2PSZr, X86::VEXP2PSZmb, TB_BCAST_SS}, - {X86::VFPCLASSPBF16Z128ri, X86::VFPCLASSPBF16Z128mbi, TB_BCAST_SH}, - {X86::VFPCLASSPBF16Z256ri, X86::VFPCLASSPBF16Z256mbi, TB_BCAST_SH}, - {X86::VFPCLASSPBF16Zri, X86::VFPCLASSPBF16Zmbi, TB_BCAST_SH}, + {X86::VFPCLASSBF16Z128ri, X86::VFPCLASSBF16Z128mbi, TB_BCAST_SH}, + {X86::VFPCLASSBF16Z256ri, 
X86::VFPCLASSBF16Z256mbi, TB_BCAST_SH}, + {X86::VFPCLASSBF16Zri, X86::VFPCLASSBF16Zmbi, TB_BCAST_SH}, {X86::VFPCLASSPDZ128ri, X86::VFPCLASSPDZ128mbi, TB_BCAST_SD}, {X86::VFPCLASSPDZ256ri, X86::VFPCLASSPDZ256mbi, TB_BCAST_SD}, {X86::VFPCLASSPDZri, X86::VFPCLASSPDZmbi, TB_BCAST_SD}, @@ -7656,9 +7656,9 @@ static const X86FoldTableEntry BroadcastTable1[] = { {X86::VFPCLASSPSZ128ri, X86::VFPCLASSPSZ128mbi, TB_BCAST_SS}, {X86::VFPCLASSPSZ256ri, X86::VFPCLASSPSZ256mbi, TB_BCAST_SS}, {X86::VFPCLASSPSZri, X86::VFPCLASSPSZmbi, TB_BCAST_SS}, - {X86::VGETEXPPBF16Z128r, X86::VGETEXPPBF16Z128mb, TB_BCAST_SH}, - {X86::VGETEXPPBF16Z256r, X86::VGETEXPPBF16Z256mb, TB_BCAST_SH}, - {X86::VGETEXPPBF16Zr, X86::VGETEXPPBF16Zmb, TB_BCAST_SH}, + {X86::VGETEXPBF16Z128r, X86::VGETEXPBF16Z128mb, TB_BCAST_SH}, + {X86::VGETEXPBF16Z256r, X86::VGETEXPBF16Z256mb, TB_BCAST_SH}, + {X86::VGETEXPBF16Zr, X86::VGETEXPBF16Zmb, TB_BCAST_SH}, {X86::VGETEXPPDZ128r, X86::VGETEXPPDZ128mb, TB_BCAST_SD}, {X86::VGETEXPPDZ256r, X86::VGETEXPPDZ256mb, TB_BCAST_SD}, {X86::VGETEXPPDZr, X86::VGETEXPPDZmb, TB_BCAST_SD}, @@ -7668,9 +7668,9 @@ static const X86FoldTableEntry BroadcastTable1[] = { {X86::VGETEXPPSZ128r, X86::VGETEXPPSZ128mb, TB_BCAST_SS}, {X86::VGETEXPPSZ256r, X86::VGETEXPPSZ256mb, TB_BCAST_SS}, {X86::VGETEXPPSZr, X86::VGETEXPPSZmb, TB_BCAST_SS}, - {X86::VGETMANTPBF16Z128rri, X86::VGETMANTPBF16Z128rmbi, TB_BCAST_SH}, - {X86::VGETMANTPBF16Z256rri, X86::VGETMANTPBF16Z256rmbi, TB_BCAST_SH}, - {X86::VGETMANTPBF16Zrri, X86::VGETMANTPBF16Zrmbi, TB_BCAST_SH}, + {X86::VGETMANTBF16Z128rri, X86::VGETMANTBF16Z128rmbi, TB_BCAST_SH}, + {X86::VGETMANTBF16Z256rri, X86::VGETMANTBF16Z256rmbi, TB_BCAST_SH}, + {X86::VGETMANTBF16Zrri, X86::VGETMANTBF16Zrmbi, TB_BCAST_SH}, {X86::VGETMANTPDZ128rri, X86::VGETMANTPDZ128rmbi, TB_BCAST_SD}, {X86::VGETMANTPDZ256rri, X86::VGETMANTPDZ256rmbi, TB_BCAST_SD}, {X86::VGETMANTPDZrri, X86::VGETMANTPDZrmbi, TB_BCAST_SD}, @@ -7755,15 +7755,15 @@ static const X86FoldTableEntry BroadcastTable1[] 
= { {X86::VRCP14PSZr, X86::VRCP14PSZmb, TB_BCAST_SS}, {X86::VRCP28PDZr, X86::VRCP28PDZmb, TB_BCAST_SD}, {X86::VRCP28PSZr, X86::VRCP28PSZmb, TB_BCAST_SS}, - {X86::VRCPPBF16Z128r, X86::VRCPPBF16Z128mb, TB_BCAST_SH}, - {X86::VRCPPBF16Z256r, X86::VRCPPBF16Z256mb, TB_BCAST_SH}, - {X86::VRCPPBF16Zr, X86::VRCPPBF16Zmb, TB_BCAST_SH}, + {X86::VRCPBF16Z128r, X86::VRCPBF16Z128mb, TB_BCAST_SH}, + {X86::VRCPBF16Z256r, X86::VRCPBF16Z256mb, TB_BCAST_SH}, + {X86::VRCPBF16Zr, X86::VRCPBF16Zmb, TB_BCAST_SH}, {X86::VRCPPHZ128r, X86::VRCPPHZ128mb, TB_BCAST_SH}, {X86::VRCPPHZ256r, X86::VRCPPHZ256mb, TB_BCAST_SH}, {X86::VRCPPHZr, X86::VRCPPHZmb, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Z128rri, X86::VREDUCENEPBF16Z128rmbi, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Z256rri, X86::VREDUCENEPBF16Z256rmbi, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Zrri, X86::VREDUCENEPBF16Zrmbi, TB_BCAST_SH}, + {X86::VREDUCEBF16Z128rri, X86::VREDUCEBF16Z128rmbi, TB_BCAST_SH}, + {X86::VREDUCEBF16Z256rri, X86::VREDUCEBF16Z256rmbi, TB_BCAST_SH}, + {X86::VREDUCEBF16Zrri, X86::VREDUCEBF16Zrmbi, TB_BCAST_SH}, {X86::VREDUCEPDZ128rri, X86::VREDUCEPDZ128rmbi, TB_BCAST_SD}, {X86::VREDUCEPDZ256rri, X86::VREDUCEPDZ256rmbi, TB_BCAST_SD}, {X86::VREDUCEPDZrri, X86::VREDUCEPDZrmbi, TB_BCAST_SD}, @@ -7773,9 +7773,9 @@ static const X86FoldTableEntry BroadcastTable1[] = { {X86::VREDUCEPSZ128rri, X86::VREDUCEPSZ128rmbi, TB_BCAST_SS}, {X86::VREDUCEPSZ256rri, X86::VREDUCEPSZ256rmbi, TB_BCAST_SS}, {X86::VREDUCEPSZrri, X86::VREDUCEPSZrmbi, TB_BCAST_SS}, - {X86::VRNDSCALENEPBF16Z128rri, X86::VRNDSCALENEPBF16Z128rmbi, TB_BCAST_SH}, - {X86::VRNDSCALENEPBF16Z256rri, X86::VRNDSCALENEPBF16Z256rmbi, TB_BCAST_SH}, - {X86::VRNDSCALENEPBF16Zrri, X86::VRNDSCALENEPBF16Zrmbi, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Z128rri, X86::VRNDSCALEBF16Z128rmbi, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Z256rri, X86::VRNDSCALEBF16Z256rmbi, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Zrri, X86::VRNDSCALEBF16Zrmbi, TB_BCAST_SH}, {X86::VRNDSCALEPDZ128rri, X86::VRNDSCALEPDZ128rmbi, TB_BCAST_SD}, 
{X86::VRNDSCALEPDZ256rri, X86::VRNDSCALEPDZ256rmbi, TB_BCAST_SD}, {X86::VRNDSCALEPDZrri, X86::VRNDSCALEPDZrmbi, TB_BCAST_SD}, @@ -7793,15 +7793,15 @@ static const X86FoldTableEntry BroadcastTable1[] = { {X86::VRSQRT14PSZr, X86::VRSQRT14PSZmb, TB_BCAST_SS}, {X86::VRSQRT28PDZr, X86::VRSQRT28PDZmb, TB_BCAST_SD}, {X86::VRSQRT28PSZr, X86::VRSQRT28PSZmb, TB_BCAST_SS}, - {X86::VRSQRTPBF16Z128r, X86::VRSQRTPBF16Z128mb, TB_BCAST_SH}, - {X86::VRSQRTPBF16Z256r, X86::VRSQRTPBF16Z256mb, TB_BCAST_SH}, - {X86::VRSQRTPBF16Zr, X86::VRSQRTPBF16Zmb, TB_BCAST_SH}, + {X86::VRSQRTBF16Z128r, X86::VRSQRTBF16Z128mb, TB_BCAST_SH}, + {X86::VRSQRTBF16Z256r, X86::VRSQRTBF16Z256mb, TB_BCAST_SH}, + {X86::VRSQRTBF16Zr, X86::VRSQRTBF16Zmb, TB_BCAST_SH}, {X86::VRSQRTPHZ128r, X86::VRSQRTPHZ128mb, TB_BCAST_SH}, {X86::VRSQRTPHZ256r, X86::VRSQRTPHZ256mb, TB_BCAST_SH}, {X86::VRSQRTPHZr, X86::VRSQRTPHZmb, TB_BCAST_SH}, - {X86::VSQRTNEPBF16Z128r, X86::VSQRTNEPBF16Z128mb, TB_BCAST_SH}, - {X86::VSQRTNEPBF16Z256r, X86::VSQRTNEPBF16Z256mb, TB_BCAST_SH}, - {X86::VSQRTNEPBF16Zr, X86::VSQRTNEPBF16Zmb, TB_BCAST_SH}, + {X86::VSQRTBF16Z128r, X86::VSQRTBF16Z128mb, TB_BCAST_SH}, + {X86::VSQRTBF16Z256r, X86::VSQRTBF16Z256mb, TB_BCAST_SH}, + {X86::VSQRTBF16Zr, X86::VSQRTBF16Zmb, TB_BCAST_SH}, {X86::VSQRTPDZ128r, X86::VSQRTPDZ128mb, TB_BCAST_SD}, {X86::VSQRTPDZ256r, X86::VSQRTPDZ256mb, TB_BCAST_SD}, {X86::VSQRTPDZr, X86::VSQRTPDZmb, TB_BCAST_SD}, @@ -7814,9 +7814,9 @@ static const X86FoldTableEntry BroadcastTable1[] = { }; static const X86FoldTableEntry BroadcastTable2[] = { - {X86::VADDNEPBF16Z128rr, X86::VADDNEPBF16Z128rmb, TB_BCAST_SH}, - {X86::VADDNEPBF16Z256rr, X86::VADDNEPBF16Z256rmb, TB_BCAST_SH}, - {X86::VADDNEPBF16Zrr, X86::VADDNEPBF16Zrmb, TB_BCAST_SH}, + {X86::VADDBF16Z128rr, X86::VADDBF16Z128rmb, TB_BCAST_SH}, + {X86::VADDBF16Z256rr, X86::VADDBF16Z256rmb, TB_BCAST_SH}, + {X86::VADDBF16Zrr, X86::VADDBF16Zrmb, TB_BCAST_SH}, {X86::VADDPDZ128rr, X86::VADDPDZ128rmb, TB_BCAST_SD}, {X86::VADDPDZ256rr, 
X86::VADDPDZ256rmb, TB_BCAST_SD}, {X86::VADDPDZrr, X86::VADDPDZrmb, TB_BCAST_SD}, @@ -7850,9 +7850,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VBLENDMPSZ128rr, X86::VBLENDMPSZ128rmb, TB_BCAST_SS}, {X86::VBLENDMPSZ256rr, X86::VBLENDMPSZ256rmb, TB_BCAST_SS}, {X86::VBLENDMPSZrr, X86::VBLENDMPSZrmb, TB_BCAST_SS}, - {X86::VCMPPBF16Z128rri, X86::VCMPPBF16Z128rmbi, TB_BCAST_SH}, - {X86::VCMPPBF16Z256rri, X86::VCMPPBF16Z256rmbi, TB_BCAST_SH}, - {X86::VCMPPBF16Zrri, X86::VCMPPBF16Zrmbi, TB_BCAST_SH}, + {X86::VCMPBF16Z128rri, X86::VCMPBF16Z128rmbi, TB_BCAST_SH}, + {X86::VCMPBF16Z256rri, X86::VCMPBF16Z256rmbi, TB_BCAST_SH}, + {X86::VCMPBF16Zrri, X86::VCMPBF16Zrmbi, TB_BCAST_SH}, {X86::VCMPPDZ128rri, X86::VCMPPDZ128rmbi, TB_BCAST_SD}, {X86::VCMPPDZ256rri, X86::VCMPPDZ256rmbi, TB_BCAST_SD}, {X86::VCMPPDZrri, X86::VCMPPDZrmbi, TB_BCAST_SD}, @@ -8111,9 +8111,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VCVTW2PHZ128rrkz, X86::VCVTW2PHZ128rmbkz, TB_BCAST_W}, {X86::VCVTW2PHZ256rrkz, X86::VCVTW2PHZ256rmbkz, TB_BCAST_W}, {X86::VCVTW2PHZrrkz, X86::VCVTW2PHZrmbkz, TB_BCAST_W}, - {X86::VDIVNEPBF16Z128rr, X86::VDIVNEPBF16Z128rmb, TB_BCAST_SH}, - {X86::VDIVNEPBF16Z256rr, X86::VDIVNEPBF16Z256rmb, TB_BCAST_SH}, - {X86::VDIVNEPBF16Zrr, X86::VDIVNEPBF16Zrmb, TB_BCAST_SH}, + {X86::VDIVBF16Z128rr, X86::VDIVBF16Z128rmb, TB_BCAST_SH}, + {X86::VDIVBF16Z256rr, X86::VDIVBF16Z256rmb, TB_BCAST_SH}, + {X86::VDIVBF16Zrr, X86::VDIVBF16Zrmb, TB_BCAST_SH}, {X86::VDIVPDZ128rr, X86::VDIVPDZ128rmb, TB_BCAST_SD}, {X86::VDIVPDZ256rr, X86::VDIVPDZ256rmb, TB_BCAST_SD}, {X86::VDIVPDZrr, X86::VDIVPDZrmb, TB_BCAST_SD}, @@ -8131,9 +8131,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VFMULCPHZ128rr, X86::VFMULCPHZ128rmb, TB_BCAST_SS}, {X86::VFMULCPHZ256rr, X86::VFMULCPHZ256rmb, TB_BCAST_SS}, {X86::VFMULCPHZrr, X86::VFMULCPHZrmb, TB_BCAST_SS}, - {X86::VFPCLASSPBF16Z128rik, X86::VFPCLASSPBF16Z128mbik, TB_BCAST_SH}, - {X86::VFPCLASSPBF16Z256rik, 
X86::VFPCLASSPBF16Z256mbik, TB_BCAST_SH}, - {X86::VFPCLASSPBF16Zrik, X86::VFPCLASSPBF16Zmbik, TB_BCAST_SH}, + {X86::VFPCLASSBF16Z128rik, X86::VFPCLASSBF16Z128mbik, TB_BCAST_SH}, + {X86::VFPCLASSBF16Z256rik, X86::VFPCLASSBF16Z256mbik, TB_BCAST_SH}, + {X86::VFPCLASSBF16Zrik, X86::VFPCLASSBF16Zmbik, TB_BCAST_SH}, {X86::VFPCLASSPDZ128rik, X86::VFPCLASSPDZ128mbik, TB_BCAST_SD}, {X86::VFPCLASSPDZ256rik, X86::VFPCLASSPDZ256mbik, TB_BCAST_SD}, {X86::VFPCLASSPDZrik, X86::VFPCLASSPDZmbik, TB_BCAST_SD}, @@ -8143,9 +8143,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VFPCLASSPSZ128rik, X86::VFPCLASSPSZ128mbik, TB_BCAST_SS}, {X86::VFPCLASSPSZ256rik, X86::VFPCLASSPSZ256mbik, TB_BCAST_SS}, {X86::VFPCLASSPSZrik, X86::VFPCLASSPSZmbik, TB_BCAST_SS}, - {X86::VGETEXPPBF16Z128rkz, X86::VGETEXPPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VGETEXPPBF16Z256rkz, X86::VGETEXPPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VGETEXPPBF16Zrkz, X86::VGETEXPPBF16Zmbkz, TB_BCAST_SH}, + {X86::VGETEXPBF16Z128rkz, X86::VGETEXPBF16Z128mbkz, TB_BCAST_SH}, + {X86::VGETEXPBF16Z256rkz, X86::VGETEXPBF16Z256mbkz, TB_BCAST_SH}, + {X86::VGETEXPBF16Zrkz, X86::VGETEXPBF16Zmbkz, TB_BCAST_SH}, {X86::VGETEXPPDZ128rkz, X86::VGETEXPPDZ128mbkz, TB_BCAST_SD}, {X86::VGETEXPPDZ256rkz, X86::VGETEXPPDZ256mbkz, TB_BCAST_SD}, {X86::VGETEXPPDZrkz, X86::VGETEXPPDZmbkz, TB_BCAST_SD}, @@ -8155,9 +8155,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VGETEXPPSZ128rkz, X86::VGETEXPPSZ128mbkz, TB_BCAST_SS}, {X86::VGETEXPPSZ256rkz, X86::VGETEXPPSZ256mbkz, TB_BCAST_SS}, {X86::VGETEXPPSZrkz, X86::VGETEXPPSZmbkz, TB_BCAST_SS}, - {X86::VGETMANTPBF16Z128rrikz, X86::VGETMANTPBF16Z128rmbikz, TB_BCAST_SH}, - {X86::VGETMANTPBF16Z256rrikz, X86::VGETMANTPBF16Z256rmbikz, TB_BCAST_SH}, - {X86::VGETMANTPBF16Zrrikz, X86::VGETMANTPBF16Zrmbikz, TB_BCAST_SH}, + {X86::VGETMANTBF16Z128rrikz, X86::VGETMANTBF16Z128rmbikz, TB_BCAST_SH}, + {X86::VGETMANTBF16Z256rrikz, X86::VGETMANTBF16Z256rmbikz, TB_BCAST_SH}, + {X86::VGETMANTBF16Zrrikz, 
X86::VGETMANTBF16Zrmbikz, TB_BCAST_SH}, {X86::VGETMANTPDZ128rrikz, X86::VGETMANTPDZ128rmbikz, TB_BCAST_SD}, {X86::VGETMANTPDZ256rrikz, X86::VGETMANTPDZ256rmbikz, TB_BCAST_SD}, {X86::VGETMANTPDZrrikz, X86::VGETMANTPDZrmbikz, TB_BCAST_SD}, @@ -8173,6 +8173,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VGF2P8AFFINEQBZ128rri, X86::VGF2P8AFFINEQBZ128rmbi, TB_BCAST_Q}, {X86::VGF2P8AFFINEQBZ256rri, X86::VGF2P8AFFINEQBZ256rmbi, TB_BCAST_Q}, {X86::VGF2P8AFFINEQBZrri, X86::VGF2P8AFFINEQBZrmbi, TB_BCAST_Q}, + {X86::VMAXBF16Z128rr, X86::VMAXBF16Z128rmb, TB_BCAST_SH}, + {X86::VMAXBF16Z256rr, X86::VMAXBF16Z256rmb, TB_BCAST_SH}, + {X86::VMAXBF16Zrr, X86::VMAXBF16Zrmb, TB_BCAST_SH}, {X86::VMAXCPDZ128rr, X86::VMAXCPDZ128rmb, TB_BCAST_SD}, {X86::VMAXCPDZ256rr, X86::VMAXCPDZ256rmb, TB_BCAST_SD}, {X86::VMAXCPDZrr, X86::VMAXCPDZrmb, TB_BCAST_SD}, @@ -8182,9 +8185,6 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VMAXCPSZ128rr, X86::VMAXCPSZ128rmb, TB_BCAST_SS}, {X86::VMAXCPSZ256rr, X86::VMAXCPSZ256rmb, TB_BCAST_SS}, {X86::VMAXCPSZrr, X86::VMAXCPSZrmb, TB_BCAST_SS}, - {X86::VMAXPBF16Z128rr, X86::VMAXPBF16Z128rmb, TB_BCAST_SH}, - {X86::VMAXPBF16Z256rr, X86::VMAXPBF16Z256rmb, TB_BCAST_SH}, - {X86::VMAXPBF16Zrr, X86::VMAXPBF16Zrmb, TB_BCAST_SH}, {X86::VMAXPDZ128rr, X86::VMAXPDZ128rmb, TB_BCAST_SD}, {X86::VMAXPDZ256rr, X86::VMAXPDZ256rmb, TB_BCAST_SD}, {X86::VMAXPDZrr, X86::VMAXPDZrmb, TB_BCAST_SD}, @@ -8194,6 +8194,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VMAXPSZ128rr, X86::VMAXPSZ128rmb, TB_BCAST_SS}, {X86::VMAXPSZ256rr, X86::VMAXPSZ256rmb, TB_BCAST_SS}, {X86::VMAXPSZrr, X86::VMAXPSZrmb, TB_BCAST_SS}, + {X86::VMINBF16Z128rr, X86::VMINBF16Z128rmb, TB_BCAST_SH}, + {X86::VMINBF16Z256rr, X86::VMINBF16Z256rmb, TB_BCAST_SH}, + {X86::VMINBF16Zrr, X86::VMINBF16Zrmb, TB_BCAST_SH}, {X86::VMINCPDZ128rr, X86::VMINCPDZ128rmb, TB_BCAST_SD}, {X86::VMINCPDZ256rr, X86::VMINCPDZ256rmb, TB_BCAST_SD}, {X86::VMINCPDZrr, X86::VMINCPDZrmb, TB_BCAST_SD}, @@ 
-8215,9 +8218,6 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VMINMAXPSZ128rri, X86::VMINMAXPSZ128rmbi, TB_BCAST_SS}, {X86::VMINMAXPSZ256rri, X86::VMINMAXPSZ256rmbi, TB_BCAST_SS}, {X86::VMINMAXPSZrri, X86::VMINMAXPSZrmbi, TB_BCAST_SS}, - {X86::VMINPBF16Z128rr, X86::VMINPBF16Z128rmb, TB_BCAST_SH}, - {X86::VMINPBF16Z256rr, X86::VMINPBF16Z256rmb, TB_BCAST_SH}, - {X86::VMINPBF16Zrr, X86::VMINPBF16Zrmb, TB_BCAST_SH}, {X86::VMINPDZ128rr, X86::VMINPDZ128rmb, TB_BCAST_SD}, {X86::VMINPDZ256rr, X86::VMINPDZ256rmb, TB_BCAST_SD}, {X86::VMINPDZrr, X86::VMINPDZrmb, TB_BCAST_SD}, @@ -8227,9 +8227,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VMINPSZ128rr, X86::VMINPSZ128rmb, TB_BCAST_SS}, {X86::VMINPSZ256rr, X86::VMINPSZ256rmb, TB_BCAST_SS}, {X86::VMINPSZrr, X86::VMINPSZrmb, TB_BCAST_SS}, - {X86::VMULNEPBF16Z128rr, X86::VMULNEPBF16Z128rmb, TB_BCAST_SH}, - {X86::VMULNEPBF16Z256rr, X86::VMULNEPBF16Z256rmb, TB_BCAST_SH}, - {X86::VMULNEPBF16Zrr, X86::VMULNEPBF16Zrmb, TB_BCAST_SH}, + {X86::VMULBF16Z128rr, X86::VMULBF16Z128rmb, TB_BCAST_SH}, + {X86::VMULBF16Z256rr, X86::VMULBF16Z256rmb, TB_BCAST_SH}, + {X86::VMULBF16Zrr, X86::VMULBF16Zrmb, TB_BCAST_SH}, {X86::VMULPDZ128rr, X86::VMULPDZ128rmb, TB_BCAST_SD}, {X86::VMULPDZ256rr, X86::VMULPDZ256rmb, TB_BCAST_SD}, {X86::VMULPDZrr, X86::VMULPDZrmb, TB_BCAST_SD}, @@ -8523,15 +8523,15 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VRCP14PSZrkz, X86::VRCP14PSZmbkz, TB_BCAST_SS}, {X86::VRCP28PDZrkz, X86::VRCP28PDZmbkz, TB_BCAST_SD}, {X86::VRCP28PSZrkz, X86::VRCP28PSZmbkz, TB_BCAST_SS}, - {X86::VRCPPBF16Z128rkz, X86::VRCPPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VRCPPBF16Z256rkz, X86::VRCPPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VRCPPBF16Zrkz, X86::VRCPPBF16Zmbkz, TB_BCAST_SH}, + {X86::VRCPBF16Z128rkz, X86::VRCPBF16Z128mbkz, TB_BCAST_SH}, + {X86::VRCPBF16Z256rkz, X86::VRCPBF16Z256mbkz, TB_BCAST_SH}, + {X86::VRCPBF16Zrkz, X86::VRCPBF16Zmbkz, TB_BCAST_SH}, {X86::VRCPPHZ128rkz, X86::VRCPPHZ128mbkz, 
TB_BCAST_SH}, {X86::VRCPPHZ256rkz, X86::VRCPPHZ256mbkz, TB_BCAST_SH}, {X86::VRCPPHZrkz, X86::VRCPPHZmbkz, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Z128rrikz, X86::VREDUCENEPBF16Z128rmbikz, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Z256rrikz, X86::VREDUCENEPBF16Z256rmbikz, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Zrrikz, X86::VREDUCENEPBF16Zrmbikz, TB_BCAST_SH}, + {X86::VREDUCEBF16Z128rrikz, X86::VREDUCEBF16Z128rmbikz, TB_BCAST_SH}, + {X86::VREDUCEBF16Z256rrikz, X86::VREDUCEBF16Z256rmbikz, TB_BCAST_SH}, + {X86::VREDUCEBF16Zrrikz, X86::VREDUCEBF16Zrmbikz, TB_BCAST_SH}, {X86::VREDUCEPDZ128rrikz, X86::VREDUCEPDZ128rmbikz, TB_BCAST_SD}, {X86::VREDUCEPDZ256rrikz, X86::VREDUCEPDZ256rmbikz, TB_BCAST_SD}, {X86::VREDUCEPDZrrikz, X86::VREDUCEPDZrmbikz, TB_BCAST_SD}, @@ -8541,9 +8541,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VREDUCEPSZ128rrikz, X86::VREDUCEPSZ128rmbikz, TB_BCAST_SS}, {X86::VREDUCEPSZ256rrikz, X86::VREDUCEPSZ256rmbikz, TB_BCAST_SS}, {X86::VREDUCEPSZrrikz, X86::VREDUCEPSZrmbikz, TB_BCAST_SS}, - {X86::VRNDSCALENEPBF16Z128rrikz, X86::VRNDSCALENEPBF16Z128rmbikz, TB_BCAST_SH}, - {X86::VRNDSCALENEPBF16Z256rrikz, X86::VRNDSCALENEPBF16Z256rmbikz, TB_BCAST_SH}, - {X86::VRNDSCALENEPBF16Zrrikz, X86::VRNDSCALENEPBF16Zrmbikz, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Z128rrikz, X86::VRNDSCALEBF16Z128rmbikz, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Z256rrikz, X86::VRNDSCALEBF16Z256rmbikz, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Zrrikz, X86::VRNDSCALEBF16Zrmbikz, TB_BCAST_SH}, {X86::VRNDSCALEPDZ128rrikz, X86::VRNDSCALEPDZ128rmbikz, TB_BCAST_SD}, {X86::VRNDSCALEPDZ256rrikz, X86::VRNDSCALEPDZ256rmbikz, TB_BCAST_SD}, {X86::VRNDSCALEPDZrrikz, X86::VRNDSCALEPDZrmbikz, TB_BCAST_SD}, @@ -8561,15 +8561,15 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VRSQRT14PSZrkz, X86::VRSQRT14PSZmbkz, TB_BCAST_SS}, {X86::VRSQRT28PDZrkz, X86::VRSQRT28PDZmbkz, TB_BCAST_SD}, {X86::VRSQRT28PSZrkz, X86::VRSQRT28PSZmbkz, TB_BCAST_SS}, - {X86::VRSQRTPBF16Z128rkz, X86::VRSQRTPBF16Z128mbkz, 
TB_BCAST_SH}, - {X86::VRSQRTPBF16Z256rkz, X86::VRSQRTPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VRSQRTPBF16Zrkz, X86::VRSQRTPBF16Zmbkz, TB_BCAST_SH}, + {X86::VRSQRTBF16Z128rkz, X86::VRSQRTBF16Z128mbkz, TB_BCAST_SH}, + {X86::VRSQRTBF16Z256rkz, X86::VRSQRTBF16Z256mbkz, TB_BCAST_SH}, + {X86::VRSQRTBF16Zrkz, X86::VRSQRTBF16Zmbkz, TB_BCAST_SH}, {X86::VRSQRTPHZ128rkz, X86::VRSQRTPHZ128mbkz, TB_BCAST_SH}, {X86::VRSQRTPHZ256rkz, X86::VRSQRTPHZ256mbkz, TB_BCAST_SH}, {X86::VRSQRTPHZrkz, X86::VRSQRTPHZmbkz, TB_BCAST_SH}, - {X86::VSCALEFPBF16Z128rr, X86::VSCALEFPBF16Z128rmb, TB_BCAST_SH}, - {X86::VSCALEFPBF16Z256rr, X86::VSCALEFPBF16Z256rmb, TB_BCAST_SH}, - {X86::VSCALEFPBF16Zrr, X86::VSCALEFPBF16Zrmb, TB_BCAST_SH}, + {X86::VSCALEFBF16Z128rr, X86::VSCALEFBF16Z128rmb, TB_BCAST_SH}, + {X86::VSCALEFBF16Z256rr, X86::VSCALEFBF16Z256rmb, TB_BCAST_SH}, + {X86::VSCALEFBF16Zrr, X86::VSCALEFBF16Zrmb, TB_BCAST_SH}, {X86::VSCALEFPDZ128rr, X86::VSCALEFPDZ128rmb, TB_BCAST_SD}, {X86::VSCALEFPDZ256rr, X86::VSCALEFPDZ256rmb, TB_BCAST_SD}, {X86::VSCALEFPDZrr, X86::VSCALEFPDZrmb, TB_BCAST_SD}, @@ -8593,9 +8593,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VSHUFPSZ128rri, X86::VSHUFPSZ128rmbi, TB_BCAST_SS}, {X86::VSHUFPSZ256rri, X86::VSHUFPSZ256rmbi, TB_BCAST_SS}, {X86::VSHUFPSZrri, X86::VSHUFPSZrmbi, TB_BCAST_SS}, - {X86::VSQRTNEPBF16Z128rkz, X86::VSQRTNEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VSQRTNEPBF16Z256rkz, X86::VSQRTNEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VSQRTNEPBF16Zrkz, X86::VSQRTNEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VSQRTBF16Z128rkz, X86::VSQRTBF16Z128mbkz, TB_BCAST_SH}, + {X86::VSQRTBF16Z256rkz, X86::VSQRTBF16Z256mbkz, TB_BCAST_SH}, + {X86::VSQRTBF16Zrkz, X86::VSQRTBF16Zmbkz, TB_BCAST_SH}, {X86::VSQRTPDZ128rkz, X86::VSQRTPDZ128mbkz, TB_BCAST_SD}, {X86::VSQRTPDZ256rkz, X86::VSQRTPDZ256mbkz, TB_BCAST_SD}, {X86::VSQRTPDZrkz, X86::VSQRTPDZmbkz, TB_BCAST_SD}, @@ -8605,9 +8605,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { {X86::VSQRTPSZ128rkz, X86::VSQRTPSZ128mbkz, 
TB_BCAST_SS}, {X86::VSQRTPSZ256rkz, X86::VSQRTPSZ256mbkz, TB_BCAST_SS}, {X86::VSQRTPSZrkz, X86::VSQRTPSZmbkz, TB_BCAST_SS}, - {X86::VSUBNEPBF16Z128rr, X86::VSUBNEPBF16Z128rmb, TB_BCAST_SH}, - {X86::VSUBNEPBF16Z256rr, X86::VSUBNEPBF16Z256rmb, TB_BCAST_SH}, - {X86::VSUBNEPBF16Zrr, X86::VSUBNEPBF16Zrmb, TB_BCAST_SH}, + {X86::VSUBBF16Z128rr, X86::VSUBBF16Z128rmb, TB_BCAST_SH}, + {X86::VSUBBF16Z256rr, X86::VSUBBF16Z256rmb, TB_BCAST_SH}, + {X86::VSUBBF16Zrr, X86::VSUBBF16Zrmb, TB_BCAST_SH}, {X86::VSUBPDZ128rr, X86::VSUBPDZ128rmb, TB_BCAST_SD}, {X86::VSUBPDZ256rr, X86::VSUBPDZ256rmb, TB_BCAST_SD}, {X86::VSUBPDZrr, X86::VSUBPDZrmb, TB_BCAST_SD}, @@ -8638,9 +8638,9 @@ static const X86FoldTableEntry BroadcastTable2[] = { }; static const X86FoldTableEntry BroadcastTable3[] = { - {X86::VADDNEPBF16Z128rrkz, X86::VADDNEPBF16Z128rmbkz, TB_BCAST_SH}, - {X86::VADDNEPBF16Z256rrkz, X86::VADDNEPBF16Z256rmbkz, TB_BCAST_SH}, - {X86::VADDNEPBF16Zrrkz, X86::VADDNEPBF16Zrmbkz, TB_BCAST_SH}, + {X86::VADDBF16Z128rrkz, X86::VADDBF16Z128rmbkz, TB_BCAST_SH}, + {X86::VADDBF16Z256rrkz, X86::VADDBF16Z256rmbkz, TB_BCAST_SH}, + {X86::VADDBF16Zrrkz, X86::VADDBF16Zrmbkz, TB_BCAST_SH}, {X86::VADDPDZ128rrkz, X86::VADDPDZ128rmbkz, TB_BCAST_SD}, {X86::VADDPDZ256rrkz, X86::VADDPDZ256rmbkz, TB_BCAST_SD}, {X86::VADDPDZrrkz, X86::VADDPDZrmbkz, TB_BCAST_SD}, @@ -8674,9 +8674,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VBLENDMPSZ128rrk, X86::VBLENDMPSZ128rmbk, TB_BCAST_SS}, {X86::VBLENDMPSZ256rrk, X86::VBLENDMPSZ256rmbk, TB_BCAST_SS}, {X86::VBLENDMPSZrrk, X86::VBLENDMPSZrmbk, TB_BCAST_SS}, - {X86::VCMPPBF16Z128rrik, X86::VCMPPBF16Z128rmbik, TB_BCAST_SH}, - {X86::VCMPPBF16Z256rrik, X86::VCMPPBF16Z256rmbik, TB_BCAST_SH}, - {X86::VCMPPBF16Zrrik, X86::VCMPPBF16Zrmbik, TB_BCAST_SH}, + {X86::VCMPBF16Z128rrik, X86::VCMPBF16Z128rmbik, TB_BCAST_SH}, + {X86::VCMPBF16Z256rrik, X86::VCMPBF16Z256rmbik, TB_BCAST_SH}, + {X86::VCMPBF16Zrrik, X86::VCMPBF16Zrmbik, TB_BCAST_SH}, {X86::VCMPPDZ128rrik, 
X86::VCMPPDZ128rmbik, TB_BCAST_SD}, {X86::VCMPPDZ256rrik, X86::VCMPPDZ256rmbik, TB_BCAST_SD}, {X86::VCMPPDZrrik, X86::VCMPPDZrmbik, TB_BCAST_SD}, @@ -8935,9 +8935,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VCVTW2PHZ128rrk, X86::VCVTW2PHZ128rmbk, TB_BCAST_W}, {X86::VCVTW2PHZ256rrk, X86::VCVTW2PHZ256rmbk, TB_BCAST_W}, {X86::VCVTW2PHZrrk, X86::VCVTW2PHZrmbk, TB_BCAST_W}, - {X86::VDIVNEPBF16Z128rrkz, X86::VDIVNEPBF16Z128rmbkz, TB_BCAST_SH}, - {X86::VDIVNEPBF16Z256rrkz, X86::VDIVNEPBF16Z256rmbkz, TB_BCAST_SH}, - {X86::VDIVNEPBF16Zrrkz, X86::VDIVNEPBF16Zrmbkz, TB_BCAST_SH}, + {X86::VDIVBF16Z128rrkz, X86::VDIVBF16Z128rmbkz, TB_BCAST_SH}, + {X86::VDIVBF16Z256rrkz, X86::VDIVBF16Z256rmbkz, TB_BCAST_SH}, + {X86::VDIVBF16Zrrkz, X86::VDIVBF16Zrmbkz, TB_BCAST_SH}, {X86::VDIVPDZ128rrkz, X86::VDIVPDZ128rmbkz, TB_BCAST_SD}, {X86::VDIVPDZ256rrkz, X86::VDIVPDZ256rmbkz, TB_BCAST_SD}, {X86::VDIVPDZrrkz, X86::VDIVPDZrmbkz, TB_BCAST_SD}, @@ -8967,9 +8967,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFIXUPIMMPSZ128rri, X86::VFIXUPIMMPSZ128rmbi, TB_BCAST_SS}, {X86::VFIXUPIMMPSZ256rri, X86::VFIXUPIMMPSZ256rmbi, TB_BCAST_SS}, {X86::VFIXUPIMMPSZrri, X86::VFIXUPIMMPSZrmbi, TB_BCAST_SS}, - {X86::VFMADD132NEPBF16Z128r, X86::VFMADD132NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFMADD132NEPBF16Z256r, X86::VFMADD132NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFMADD132NEPBF16Zr, X86::VFMADD132NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFMADD132BF16Z128r, X86::VFMADD132BF16Z128mb, TB_BCAST_SH}, + {X86::VFMADD132BF16Z256r, X86::VFMADD132BF16Z256mb, TB_BCAST_SH}, + {X86::VFMADD132BF16Zr, X86::VFMADD132BF16Zmb, TB_BCAST_SH}, {X86::VFMADD132PDZ128r, X86::VFMADD132PDZ128mb, TB_BCAST_SD}, {X86::VFMADD132PDZ256r, X86::VFMADD132PDZ256mb, TB_BCAST_SD}, {X86::VFMADD132PDZr, X86::VFMADD132PDZmb, TB_BCAST_SD}, @@ -8979,9 +8979,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFMADD132PSZ128r, X86::VFMADD132PSZ128mb, TB_BCAST_SS}, {X86::VFMADD132PSZ256r, X86::VFMADD132PSZ256mb, 
TB_BCAST_SS}, {X86::VFMADD132PSZr, X86::VFMADD132PSZmb, TB_BCAST_SS}, - {X86::VFMADD213NEPBF16Z128r, X86::VFMADD213NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFMADD213NEPBF16Z256r, X86::VFMADD213NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFMADD213NEPBF16Zr, X86::VFMADD213NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFMADD213BF16Z128r, X86::VFMADD213BF16Z128mb, TB_BCAST_SH}, + {X86::VFMADD213BF16Z256r, X86::VFMADD213BF16Z256mb, TB_BCAST_SH}, + {X86::VFMADD213BF16Zr, X86::VFMADD213BF16Zmb, TB_BCAST_SH}, {X86::VFMADD213PDZ128r, X86::VFMADD213PDZ128mb, TB_BCAST_SD}, {X86::VFMADD213PDZ256r, X86::VFMADD213PDZ256mb, TB_BCAST_SD}, {X86::VFMADD213PDZr, X86::VFMADD213PDZmb, TB_BCAST_SD}, @@ -8991,9 +8991,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFMADD213PSZ128r, X86::VFMADD213PSZ128mb, TB_BCAST_SS}, {X86::VFMADD213PSZ256r, X86::VFMADD213PSZ256mb, TB_BCAST_SS}, {X86::VFMADD213PSZr, X86::VFMADD213PSZmb, TB_BCAST_SS}, - {X86::VFMADD231NEPBF16Z128r, X86::VFMADD231NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFMADD231NEPBF16Z256r, X86::VFMADD231NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFMADD231NEPBF16Zr, X86::VFMADD231NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFMADD231BF16Z128r, X86::VFMADD231BF16Z128mb, TB_BCAST_SH}, + {X86::VFMADD231BF16Z256r, X86::VFMADD231BF16Z256mb, TB_BCAST_SH}, + {X86::VFMADD231BF16Zr, X86::VFMADD231BF16Zmb, TB_BCAST_SH}, {X86::VFMADD231PDZ128r, X86::VFMADD231PDZ128mb, TB_BCAST_SD}, {X86::VFMADD231PDZ256r, X86::VFMADD231PDZ256mb, TB_BCAST_SD}, {X86::VFMADD231PDZr, X86::VFMADD231PDZmb, TB_BCAST_SD}, @@ -9033,9 +9033,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFMADDSUB231PSZ128r, X86::VFMADDSUB231PSZ128mb, TB_BCAST_SS}, {X86::VFMADDSUB231PSZ256r, X86::VFMADDSUB231PSZ256mb, TB_BCAST_SS}, {X86::VFMADDSUB231PSZr, X86::VFMADDSUB231PSZmb, TB_BCAST_SS}, - {X86::VFMSUB132NEPBF16Z128r, X86::VFMSUB132NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFMSUB132NEPBF16Z256r, X86::VFMSUB132NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFMSUB132NEPBF16Zr, X86::VFMSUB132NEPBF16Zmb, 
TB_BCAST_SH}, + {X86::VFMSUB132BF16Z128r, X86::VFMSUB132BF16Z128mb, TB_BCAST_SH}, + {X86::VFMSUB132BF16Z256r, X86::VFMSUB132BF16Z256mb, TB_BCAST_SH}, + {X86::VFMSUB132BF16Zr, X86::VFMSUB132BF16Zmb, TB_BCAST_SH}, {X86::VFMSUB132PDZ128r, X86::VFMSUB132PDZ128mb, TB_BCAST_SD}, {X86::VFMSUB132PDZ256r, X86::VFMSUB132PDZ256mb, TB_BCAST_SD}, {X86::VFMSUB132PDZr, X86::VFMSUB132PDZmb, TB_BCAST_SD}, @@ -9045,9 +9045,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFMSUB132PSZ128r, X86::VFMSUB132PSZ128mb, TB_BCAST_SS}, {X86::VFMSUB132PSZ256r, X86::VFMSUB132PSZ256mb, TB_BCAST_SS}, {X86::VFMSUB132PSZr, X86::VFMSUB132PSZmb, TB_BCAST_SS}, - {X86::VFMSUB213NEPBF16Z128r, X86::VFMSUB213NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFMSUB213NEPBF16Z256r, X86::VFMSUB213NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFMSUB213NEPBF16Zr, X86::VFMSUB213NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFMSUB213BF16Z128r, X86::VFMSUB213BF16Z128mb, TB_BCAST_SH}, + {X86::VFMSUB213BF16Z256r, X86::VFMSUB213BF16Z256mb, TB_BCAST_SH}, + {X86::VFMSUB213BF16Zr, X86::VFMSUB213BF16Zmb, TB_BCAST_SH}, {X86::VFMSUB213PDZ128r, X86::VFMSUB213PDZ128mb, TB_BCAST_SD}, {X86::VFMSUB213PDZ256r, X86::VFMSUB213PDZ256mb, TB_BCAST_SD}, {X86::VFMSUB213PDZr, X86::VFMSUB213PDZmb, TB_BCAST_SD}, @@ -9057,9 +9057,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFMSUB213PSZ128r, X86::VFMSUB213PSZ128mb, TB_BCAST_SS}, {X86::VFMSUB213PSZ256r, X86::VFMSUB213PSZ256mb, TB_BCAST_SS}, {X86::VFMSUB213PSZr, X86::VFMSUB213PSZmb, TB_BCAST_SS}, - {X86::VFMSUB231NEPBF16Z128r, X86::VFMSUB231NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFMSUB231NEPBF16Z256r, X86::VFMSUB231NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFMSUB231NEPBF16Zr, X86::VFMSUB231NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFMSUB231BF16Z128r, X86::VFMSUB231BF16Z128mb, TB_BCAST_SH}, + {X86::VFMSUB231BF16Z256r, X86::VFMSUB231BF16Z256mb, TB_BCAST_SH}, + {X86::VFMSUB231BF16Zr, X86::VFMSUB231BF16Zmb, TB_BCAST_SH}, {X86::VFMSUB231PDZ128r, X86::VFMSUB231PDZ128mb, TB_BCAST_SD}, {X86::VFMSUB231PDZ256r, 
X86::VFMSUB231PDZ256mb, TB_BCAST_SD}, {X86::VFMSUB231PDZr, X86::VFMSUB231PDZmb, TB_BCAST_SD}, @@ -9099,9 +9099,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFMULCPHZ128rrkz, X86::VFMULCPHZ128rmbkz, TB_BCAST_SS}, {X86::VFMULCPHZ256rrkz, X86::VFMULCPHZ256rmbkz, TB_BCAST_SS}, {X86::VFMULCPHZrrkz, X86::VFMULCPHZrmbkz, TB_BCAST_SS}, - {X86::VFNMADD132NEPBF16Z128r, X86::VFNMADD132NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFNMADD132NEPBF16Z256r, X86::VFNMADD132NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFNMADD132NEPBF16Zr, X86::VFNMADD132NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFNMADD132BF16Z128r, X86::VFNMADD132BF16Z128mb, TB_BCAST_SH}, + {X86::VFNMADD132BF16Z256r, X86::VFNMADD132BF16Z256mb, TB_BCAST_SH}, + {X86::VFNMADD132BF16Zr, X86::VFNMADD132BF16Zmb, TB_BCAST_SH}, {X86::VFNMADD132PDZ128r, X86::VFNMADD132PDZ128mb, TB_BCAST_SD}, {X86::VFNMADD132PDZ256r, X86::VFNMADD132PDZ256mb, TB_BCAST_SD}, {X86::VFNMADD132PDZr, X86::VFNMADD132PDZmb, TB_BCAST_SD}, @@ -9111,9 +9111,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFNMADD132PSZ128r, X86::VFNMADD132PSZ128mb, TB_BCAST_SS}, {X86::VFNMADD132PSZ256r, X86::VFNMADD132PSZ256mb, TB_BCAST_SS}, {X86::VFNMADD132PSZr, X86::VFNMADD132PSZmb, TB_BCAST_SS}, - {X86::VFNMADD213NEPBF16Z128r, X86::VFNMADD213NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFNMADD213NEPBF16Z256r, X86::VFNMADD213NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFNMADD213NEPBF16Zr, X86::VFNMADD213NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFNMADD213BF16Z128r, X86::VFNMADD213BF16Z128mb, TB_BCAST_SH}, + {X86::VFNMADD213BF16Z256r, X86::VFNMADD213BF16Z256mb, TB_BCAST_SH}, + {X86::VFNMADD213BF16Zr, X86::VFNMADD213BF16Zmb, TB_BCAST_SH}, {X86::VFNMADD213PDZ128r, X86::VFNMADD213PDZ128mb, TB_BCAST_SD}, {X86::VFNMADD213PDZ256r, X86::VFNMADD213PDZ256mb, TB_BCAST_SD}, {X86::VFNMADD213PDZr, X86::VFNMADD213PDZmb, TB_BCAST_SD}, @@ -9123,9 +9123,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFNMADD213PSZ128r, X86::VFNMADD213PSZ128mb, TB_BCAST_SS}, {X86::VFNMADD213PSZ256r, 
X86::VFNMADD213PSZ256mb, TB_BCAST_SS}, {X86::VFNMADD213PSZr, X86::VFNMADD213PSZmb, TB_BCAST_SS}, - {X86::VFNMADD231NEPBF16Z128r, X86::VFNMADD231NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFNMADD231NEPBF16Z256r, X86::VFNMADD231NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFNMADD231NEPBF16Zr, X86::VFNMADD231NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFNMADD231BF16Z128r, X86::VFNMADD231BF16Z128mb, TB_BCAST_SH}, + {X86::VFNMADD231BF16Z256r, X86::VFNMADD231BF16Z256mb, TB_BCAST_SH}, + {X86::VFNMADD231BF16Zr, X86::VFNMADD231BF16Zmb, TB_BCAST_SH}, {X86::VFNMADD231PDZ128r, X86::VFNMADD231PDZ128mb, TB_BCAST_SD}, {X86::VFNMADD231PDZ256r, X86::VFNMADD231PDZ256mb, TB_BCAST_SD}, {X86::VFNMADD231PDZr, X86::VFNMADD231PDZmb, TB_BCAST_SD}, @@ -9135,9 +9135,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFNMADD231PSZ128r, X86::VFNMADD231PSZ128mb, TB_BCAST_SS}, {X86::VFNMADD231PSZ256r, X86::VFNMADD231PSZ256mb, TB_BCAST_SS}, {X86::VFNMADD231PSZr, X86::VFNMADD231PSZmb, TB_BCAST_SS}, - {X86::VFNMSUB132NEPBF16Z128r, X86::VFNMSUB132NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFNMSUB132NEPBF16Z256r, X86::VFNMSUB132NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFNMSUB132NEPBF16Zr, X86::VFNMSUB132NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Z128r, X86::VFNMSUB132BF16Z128mb, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Z256r, X86::VFNMSUB132BF16Z256mb, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Zr, X86::VFNMSUB132BF16Zmb, TB_BCAST_SH}, {X86::VFNMSUB132PDZ128r, X86::VFNMSUB132PDZ128mb, TB_BCAST_SD}, {X86::VFNMSUB132PDZ256r, X86::VFNMSUB132PDZ256mb, TB_BCAST_SD}, {X86::VFNMSUB132PDZr, X86::VFNMSUB132PDZmb, TB_BCAST_SD}, @@ -9147,9 +9147,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFNMSUB132PSZ128r, X86::VFNMSUB132PSZ128mb, TB_BCAST_SS}, {X86::VFNMSUB132PSZ256r, X86::VFNMSUB132PSZ256mb, TB_BCAST_SS}, {X86::VFNMSUB132PSZr, X86::VFNMSUB132PSZmb, TB_BCAST_SS}, - {X86::VFNMSUB213NEPBF16Z128r, X86::VFNMSUB213NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFNMSUB213NEPBF16Z256r, X86::VFNMSUB213NEPBF16Z256mb, TB_BCAST_SH}, - 
{X86::VFNMSUB213NEPBF16Zr, X86::VFNMSUB213NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Z128r, X86::VFNMSUB213BF16Z128mb, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Z256r, X86::VFNMSUB213BF16Z256mb, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Zr, X86::VFNMSUB213BF16Zmb, TB_BCAST_SH}, {X86::VFNMSUB213PDZ128r, X86::VFNMSUB213PDZ128mb, TB_BCAST_SD}, {X86::VFNMSUB213PDZ256r, X86::VFNMSUB213PDZ256mb, TB_BCAST_SD}, {X86::VFNMSUB213PDZr, X86::VFNMSUB213PDZmb, TB_BCAST_SD}, @@ -9159,9 +9159,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFNMSUB213PSZ128r, X86::VFNMSUB213PSZ128mb, TB_BCAST_SS}, {X86::VFNMSUB213PSZ256r, X86::VFNMSUB213PSZ256mb, TB_BCAST_SS}, {X86::VFNMSUB213PSZr, X86::VFNMSUB213PSZmb, TB_BCAST_SS}, - {X86::VFNMSUB231NEPBF16Z128r, X86::VFNMSUB231NEPBF16Z128mb, TB_BCAST_SH}, - {X86::VFNMSUB231NEPBF16Z256r, X86::VFNMSUB231NEPBF16Z256mb, TB_BCAST_SH}, - {X86::VFNMSUB231NEPBF16Zr, X86::VFNMSUB231NEPBF16Zmb, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Z128r, X86::VFNMSUB231BF16Z128mb, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Z256r, X86::VFNMSUB231BF16Z256mb, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Zr, X86::VFNMSUB231BF16Zmb, TB_BCAST_SH}, {X86::VFNMSUB231PDZ128r, X86::VFNMSUB231PDZ128mb, TB_BCAST_SD}, {X86::VFNMSUB231PDZ256r, X86::VFNMSUB231PDZ256mb, TB_BCAST_SD}, {X86::VFNMSUB231PDZr, X86::VFNMSUB231PDZmb, TB_BCAST_SD}, @@ -9171,9 +9171,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VFNMSUB231PSZ128r, X86::VFNMSUB231PSZ128mb, TB_BCAST_SS}, {X86::VFNMSUB231PSZ256r, X86::VFNMSUB231PSZ256mb, TB_BCAST_SS}, {X86::VFNMSUB231PSZr, X86::VFNMSUB231PSZmb, TB_BCAST_SS}, - {X86::VGETEXPPBF16Z128rk, X86::VGETEXPPBF16Z128mbk, TB_BCAST_SH}, - {X86::VGETEXPPBF16Z256rk, X86::VGETEXPPBF16Z256mbk, TB_BCAST_SH}, - {X86::VGETEXPPBF16Zrk, X86::VGETEXPPBF16Zmbk, TB_BCAST_SH}, + {X86::VGETEXPBF16Z128rk, X86::VGETEXPBF16Z128mbk, TB_BCAST_SH}, + {X86::VGETEXPBF16Z256rk, X86::VGETEXPBF16Z256mbk, TB_BCAST_SH}, + {X86::VGETEXPBF16Zrk, X86::VGETEXPBF16Zmbk, TB_BCAST_SH}, 
{X86::VGETEXPPDZ128rk, X86::VGETEXPPDZ128mbk, TB_BCAST_SD}, {X86::VGETEXPPDZ256rk, X86::VGETEXPPDZ256mbk, TB_BCAST_SD}, {X86::VGETEXPPDZrk, X86::VGETEXPPDZmbk, TB_BCAST_SD}, @@ -9183,9 +9183,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VGETEXPPSZ128rk, X86::VGETEXPPSZ128mbk, TB_BCAST_SS}, {X86::VGETEXPPSZ256rk, X86::VGETEXPPSZ256mbk, TB_BCAST_SS}, {X86::VGETEXPPSZrk, X86::VGETEXPPSZmbk, TB_BCAST_SS}, - {X86::VGETMANTPBF16Z128rrik, X86::VGETMANTPBF16Z128rmbik, TB_BCAST_SH}, - {X86::VGETMANTPBF16Z256rrik, X86::VGETMANTPBF16Z256rmbik, TB_BCAST_SH}, - {X86::VGETMANTPBF16Zrrik, X86::VGETMANTPBF16Zrmbik, TB_BCAST_SH}, + {X86::VGETMANTBF16Z128rrik, X86::VGETMANTBF16Z128rmbik, TB_BCAST_SH}, + {X86::VGETMANTBF16Z256rrik, X86::VGETMANTBF16Z256rmbik, TB_BCAST_SH}, + {X86::VGETMANTBF16Zrrik, X86::VGETMANTBF16Zrmbik, TB_BCAST_SH}, {X86::VGETMANTPDZ128rrik, X86::VGETMANTPDZ128rmbik, TB_BCAST_SD}, {X86::VGETMANTPDZ256rrik, X86::VGETMANTPDZ256rmbik, TB_BCAST_SD}, {X86::VGETMANTPDZrrik, X86::VGETMANTPDZrmbik, TB_BCAST_SD}, @@ -9201,6 +9201,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VGF2P8AFFINEQBZ128rrikz, X86::VGF2P8AFFINEQBZ128rmbikz, TB_BCAST_Q}, {X86::VGF2P8AFFINEQBZ256rrikz, X86::VGF2P8AFFINEQBZ256rmbikz, TB_BCAST_Q}, {X86::VGF2P8AFFINEQBZrrikz, X86::VGF2P8AFFINEQBZrmbikz, TB_BCAST_Q}, + {X86::VMAXBF16Z128rrkz, X86::VMAXBF16Z128rmbkz, TB_BCAST_SH}, + {X86::VMAXBF16Z256rrkz, X86::VMAXBF16Z256rmbkz, TB_BCAST_SH}, + {X86::VMAXBF16Zrrkz, X86::VMAXBF16Zrmbkz, TB_BCAST_SH}, {X86::VMAXCPDZ128rrkz, X86::VMAXCPDZ128rmbkz, TB_BCAST_SD}, {X86::VMAXCPDZ256rrkz, X86::VMAXCPDZ256rmbkz, TB_BCAST_SD}, {X86::VMAXCPDZrrkz, X86::VMAXCPDZrmbkz, TB_BCAST_SD}, @@ -9210,9 +9213,6 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VMAXCPSZ128rrkz, X86::VMAXCPSZ128rmbkz, TB_BCAST_SS}, {X86::VMAXCPSZ256rrkz, X86::VMAXCPSZ256rmbkz, TB_BCAST_SS}, {X86::VMAXCPSZrrkz, X86::VMAXCPSZrmbkz, TB_BCAST_SS}, - {X86::VMAXPBF16Z128rrkz, X86::VMAXPBF16Z128rmbkz, 
TB_BCAST_SH}, - {X86::VMAXPBF16Z256rrkz, X86::VMAXPBF16Z256rmbkz, TB_BCAST_SH}, - {X86::VMAXPBF16Zrrkz, X86::VMAXPBF16Zrmbkz, TB_BCAST_SH}, {X86::VMAXPDZ128rrkz, X86::VMAXPDZ128rmbkz, TB_BCAST_SD}, {X86::VMAXPDZ256rrkz, X86::VMAXPDZ256rmbkz, TB_BCAST_SD}, {X86::VMAXPDZrrkz, X86::VMAXPDZrmbkz, TB_BCAST_SD}, @@ -9222,6 +9222,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VMAXPSZ128rrkz, X86::VMAXPSZ128rmbkz, TB_BCAST_SS}, {X86::VMAXPSZ256rrkz, X86::VMAXPSZ256rmbkz, TB_BCAST_SS}, {X86::VMAXPSZrrkz, X86::VMAXPSZrmbkz, TB_BCAST_SS}, + {X86::VMINBF16Z128rrkz, X86::VMINBF16Z128rmbkz, TB_BCAST_SH}, + {X86::VMINBF16Z256rrkz, X86::VMINBF16Z256rmbkz, TB_BCAST_SH}, + {X86::VMINBF16Zrrkz, X86::VMINBF16Zrmbkz, TB_BCAST_SH}, {X86::VMINCPDZ128rrkz, X86::VMINCPDZ128rmbkz, TB_BCAST_SD}, {X86::VMINCPDZ256rrkz, X86::VMINCPDZ256rmbkz, TB_BCAST_SD}, {X86::VMINCPDZrrkz, X86::VMINCPDZrmbkz, TB_BCAST_SD}, @@ -9243,9 +9246,6 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VMINMAXPSZ128rrikz, X86::VMINMAXPSZ128rmbikz, TB_BCAST_SS}, {X86::VMINMAXPSZ256rrikz, X86::VMINMAXPSZ256rmbikz, TB_BCAST_SS}, {X86::VMINMAXPSZrrikz, X86::VMINMAXPSZrmbikz, TB_BCAST_SS}, - {X86::VMINPBF16Z128rrkz, X86::VMINPBF16Z128rmbkz, TB_BCAST_SH}, - {X86::VMINPBF16Z256rrkz, X86::VMINPBF16Z256rmbkz, TB_BCAST_SH}, - {X86::VMINPBF16Zrrkz, X86::VMINPBF16Zrmbkz, TB_BCAST_SH}, {X86::VMINPDZ128rrkz, X86::VMINPDZ128rmbkz, TB_BCAST_SD}, {X86::VMINPDZ256rrkz, X86::VMINPDZ256rmbkz, TB_BCAST_SD}, {X86::VMINPDZrrkz, X86::VMINPDZrmbkz, TB_BCAST_SD}, @@ -9255,9 +9255,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VMINPSZ128rrkz, X86::VMINPSZ128rmbkz, TB_BCAST_SS}, {X86::VMINPSZ256rrkz, X86::VMINPSZ256rmbkz, TB_BCAST_SS}, {X86::VMINPSZrrkz, X86::VMINPSZrmbkz, TB_BCAST_SS}, - {X86::VMULNEPBF16Z128rrkz, X86::VMULNEPBF16Z128rmbkz, TB_BCAST_SH}, - {X86::VMULNEPBF16Z256rrkz, X86::VMULNEPBF16Z256rmbkz, TB_BCAST_SH}, - {X86::VMULNEPBF16Zrrkz, X86::VMULNEPBF16Zrmbkz, TB_BCAST_SH}, + 
{X86::VMULBF16Z128rrkz, X86::VMULBF16Z128rmbkz, TB_BCAST_SH}, + {X86::VMULBF16Z256rrkz, X86::VMULBF16Z256rmbkz, TB_BCAST_SH}, + {X86::VMULBF16Zrrkz, X86::VMULBF16Zrmbkz, TB_BCAST_SH}, {X86::VMULPDZ128rrkz, X86::VMULPDZ128rmbkz, TB_BCAST_SD}, {X86::VMULPDZ256rrkz, X86::VMULPDZ256rmbkz, TB_BCAST_SD}, {X86::VMULPDZrrkz, X86::VMULPDZrmbkz, TB_BCAST_SD}, @@ -9641,15 +9641,15 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VRCP14PSZrk, X86::VRCP14PSZmbk, TB_BCAST_SS}, {X86::VRCP28PDZrk, X86::VRCP28PDZmbk, TB_BCAST_SD}, {X86::VRCP28PSZrk, X86::VRCP28PSZmbk, TB_BCAST_SS}, - {X86::VRCPPBF16Z128rk, X86::VRCPPBF16Z128mbk, TB_BCAST_SH}, - {X86::VRCPPBF16Z256rk, X86::VRCPPBF16Z256mbk, TB_BCAST_SH}, - {X86::VRCPPBF16Zrk, X86::VRCPPBF16Zmbk, TB_BCAST_SH}, + {X86::VRCPBF16Z128rk, X86::VRCPBF16Z128mbk, TB_BCAST_SH}, + {X86::VRCPBF16Z256rk, X86::VRCPBF16Z256mbk, TB_BCAST_SH}, + {X86::VRCPBF16Zrk, X86::VRCPBF16Zmbk, TB_BCAST_SH}, {X86::VRCPPHZ128rk, X86::VRCPPHZ128mbk, TB_BCAST_SH}, {X86::VRCPPHZ256rk, X86::VRCPPHZ256mbk, TB_BCAST_SH}, {X86::VRCPPHZrk, X86::VRCPPHZmbk, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Z128rrik, X86::VREDUCENEPBF16Z128rmbik, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Z256rrik, X86::VREDUCENEPBF16Z256rmbik, TB_BCAST_SH}, - {X86::VREDUCENEPBF16Zrrik, X86::VREDUCENEPBF16Zrmbik, TB_BCAST_SH}, + {X86::VREDUCEBF16Z128rrik, X86::VREDUCEBF16Z128rmbik, TB_BCAST_SH}, + {X86::VREDUCEBF16Z256rrik, X86::VREDUCEBF16Z256rmbik, TB_BCAST_SH}, + {X86::VREDUCEBF16Zrrik, X86::VREDUCEBF16Zrmbik, TB_BCAST_SH}, {X86::VREDUCEPDZ128rrik, X86::VREDUCEPDZ128rmbik, TB_BCAST_SD}, {X86::VREDUCEPDZ256rrik, X86::VREDUCEPDZ256rmbik, TB_BCAST_SD}, {X86::VREDUCEPDZrrik, X86::VREDUCEPDZrmbik, TB_BCAST_SD}, @@ -9659,9 +9659,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VREDUCEPSZ128rrik, X86::VREDUCEPSZ128rmbik, TB_BCAST_SS}, {X86::VREDUCEPSZ256rrik, X86::VREDUCEPSZ256rmbik, TB_BCAST_SS}, {X86::VREDUCEPSZrrik, X86::VREDUCEPSZrmbik, TB_BCAST_SS}, - 
{X86::VRNDSCALENEPBF16Z128rrik, X86::VRNDSCALENEPBF16Z128rmbik, TB_BCAST_SH}, - {X86::VRNDSCALENEPBF16Z256rrik, X86::VRNDSCALENEPBF16Z256rmbik, TB_BCAST_SH}, - {X86::VRNDSCALENEPBF16Zrrik, X86::VRNDSCALENEPBF16Zrmbik, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Z128rrik, X86::VRNDSCALEBF16Z128rmbik, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Z256rrik, X86::VRNDSCALEBF16Z256rmbik, TB_BCAST_SH}, + {X86::VRNDSCALEBF16Zrrik, X86::VRNDSCALEBF16Zrmbik, TB_BCAST_SH}, {X86::VRNDSCALEPDZ128rrik, X86::VRNDSCALEPDZ128rmbik, TB_BCAST_SD}, {X86::VRNDSCALEPDZ256rrik, X86::VRNDSCALEPDZ256rmbik, TB_BCAST_SD}, {X86::VRNDSCALEPDZrrik, X86::VRNDSCALEPDZrmbik, TB_BCAST_SD}, @@ -9679,15 +9679,15 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VRSQRT14PSZrk, X86::VRSQRT14PSZmbk, TB_BCAST_SS}, {X86::VRSQRT28PDZrk, X86::VRSQRT28PDZmbk, TB_BCAST_SD}, {X86::VRSQRT28PSZrk, X86::VRSQRT28PSZmbk, TB_BCAST_SS}, - {X86::VRSQRTPBF16Z128rk, X86::VRSQRTPBF16Z128mbk, TB_BCAST_SH}, - {X86::VRSQRTPBF16Z256rk, X86::VRSQRTPBF16Z256mbk, TB_BCAST_SH}, - {X86::VRSQRTPBF16Zrk, X86::VRSQRTPBF16Zmbk, TB_BCAST_SH}, + {X86::VRSQRTBF16Z128rk, X86::VRSQRTBF16Z128mbk, TB_BCAST_SH}, + {X86::VRSQRTBF16Z256rk, X86::VRSQRTBF16Z256mbk, TB_BCAST_SH}, + {X86::VRSQRTBF16Zrk, X86::VRSQRTBF16Zmbk, TB_BCAST_SH}, {X86::VRSQRTPHZ128rk, X86::VRSQRTPHZ128mbk, TB_BCAST_SH}, {X86::VRSQRTPHZ256rk, X86::VRSQRTPHZ256mbk, TB_BCAST_SH}, {X86::VRSQRTPHZrk, X86::VRSQRTPHZmbk, TB_BCAST_SH}, - {X86::VSCALEFPBF16Z128rrkz, X86::VSCALEFPBF16Z128rmbkz, TB_BCAST_SH}, - {X86::VSCALEFPBF16Z256rrkz, X86::VSCALEFPBF16Z256rmbkz, TB_BCAST_SH}, - {X86::VSCALEFPBF16Zrrkz, X86::VSCALEFPBF16Zrmbkz, TB_BCAST_SH}, + {X86::VSCALEFBF16Z128rrkz, X86::VSCALEFBF16Z128rmbkz, TB_BCAST_SH}, + {X86::VSCALEFBF16Z256rrkz, X86::VSCALEFBF16Z256rmbkz, TB_BCAST_SH}, + {X86::VSCALEFBF16Zrrkz, X86::VSCALEFBF16Zrmbkz, TB_BCAST_SH}, {X86::VSCALEFPDZ128rrkz, X86::VSCALEFPDZ128rmbkz, TB_BCAST_SD}, {X86::VSCALEFPDZ256rrkz, X86::VSCALEFPDZ256rmbkz, TB_BCAST_SD}, 
{X86::VSCALEFPDZrrkz, X86::VSCALEFPDZrmbkz, TB_BCAST_SD}, @@ -9711,9 +9711,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VSHUFPSZ128rrikz, X86::VSHUFPSZ128rmbikz, TB_BCAST_SS}, {X86::VSHUFPSZ256rrikz, X86::VSHUFPSZ256rmbikz, TB_BCAST_SS}, {X86::VSHUFPSZrrikz, X86::VSHUFPSZrmbikz, TB_BCAST_SS}, - {X86::VSQRTNEPBF16Z128rk, X86::VSQRTNEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VSQRTNEPBF16Z256rk, X86::VSQRTNEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VSQRTNEPBF16Zrk, X86::VSQRTNEPBF16Zmbk, TB_BCAST_SH}, + {X86::VSQRTBF16Z128rk, X86::VSQRTBF16Z128mbk, TB_BCAST_SH}, + {X86::VSQRTBF16Z256rk, X86::VSQRTBF16Z256mbk, TB_BCAST_SH}, + {X86::VSQRTBF16Zrk, X86::VSQRTBF16Zmbk, TB_BCAST_SH}, {X86::VSQRTPDZ128rk, X86::VSQRTPDZ128mbk, TB_BCAST_SD}, {X86::VSQRTPDZ256rk, X86::VSQRTPDZ256mbk, TB_BCAST_SD}, {X86::VSQRTPDZrk, X86::VSQRTPDZmbk, TB_BCAST_SD}, @@ -9723,9 +9723,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { {X86::VSQRTPSZ128rk, X86::VSQRTPSZ128mbk, TB_BCAST_SS}, {X86::VSQRTPSZ256rk, X86::VSQRTPSZ256mbk, TB_BCAST_SS}, {X86::VSQRTPSZrk, X86::VSQRTPSZmbk, TB_BCAST_SS}, - {X86::VSUBNEPBF16Z128rrkz, X86::VSUBNEPBF16Z128rmbkz, TB_BCAST_SH}, - {X86::VSUBNEPBF16Z256rrkz, X86::VSUBNEPBF16Z256rmbkz, TB_BCAST_SH}, - {X86::VSUBNEPBF16Zrrkz, X86::VSUBNEPBF16Zrmbkz, TB_BCAST_SH}, + {X86::VSUBBF16Z128rrkz, X86::VSUBBF16Z128rmbkz, TB_BCAST_SH}, + {X86::VSUBBF16Z256rrkz, X86::VSUBBF16Z256rmbkz, TB_BCAST_SH}, + {X86::VSUBBF16Zrrkz, X86::VSUBBF16Zrmbkz, TB_BCAST_SH}, {X86::VSUBPDZ128rrkz, X86::VSUBPDZ128rmbkz, TB_BCAST_SD}, {X86::VSUBPDZ256rrkz, X86::VSUBPDZ256rmbkz, TB_BCAST_SD}, {X86::VSUBPDZrrkz, X86::VSUBPDZrmbkz, TB_BCAST_SD}, @@ -9756,9 +9756,9 @@ static const X86FoldTableEntry BroadcastTable3[] = { }; static const X86FoldTableEntry BroadcastTable4[] = { - {X86::VADDNEPBF16Z128rrk, X86::VADDNEPBF16Z128rmbk, TB_BCAST_SH}, - {X86::VADDNEPBF16Z256rrk, X86::VADDNEPBF16Z256rmbk, TB_BCAST_SH}, - {X86::VADDNEPBF16Zrrk, X86::VADDNEPBF16Zrmbk, TB_BCAST_SH}, + 
{X86::VADDBF16Z128rrk, X86::VADDBF16Z128rmbk, TB_BCAST_SH}, + {X86::VADDBF16Z256rrk, X86::VADDBF16Z256rmbk, TB_BCAST_SH}, + {X86::VADDBF16Zrrk, X86::VADDBF16Zrmbk, TB_BCAST_SH}, {X86::VADDPDZ128rrk, X86::VADDPDZ128rmbk, TB_BCAST_SD}, {X86::VADDPDZ256rrk, X86::VADDPDZ256rmbk, TB_BCAST_SD}, {X86::VADDPDZrrk, X86::VADDPDZrmbk, TB_BCAST_SD}, @@ -9816,9 +9816,9 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VCVTNE2PS2BF16Z128rrk, X86::VCVTNE2PS2BF16Z128rmbk, TB_BCAST_SS}, {X86::VCVTNE2PS2BF16Z256rrk, X86::VCVTNE2PS2BF16Z256rmbk, TB_BCAST_SS}, {X86::VCVTNE2PS2BF16Zrrk, X86::VCVTNE2PS2BF16Zrmbk, TB_BCAST_SS}, - {X86::VDIVNEPBF16Z128rrk, X86::VDIVNEPBF16Z128rmbk, TB_BCAST_SH}, - {X86::VDIVNEPBF16Z256rrk, X86::VDIVNEPBF16Z256rmbk, TB_BCAST_SH}, - {X86::VDIVNEPBF16Zrrk, X86::VDIVNEPBF16Zrmbk, TB_BCAST_SH}, + {X86::VDIVBF16Z128rrk, X86::VDIVBF16Z128rmbk, TB_BCAST_SH}, + {X86::VDIVBF16Z256rrk, X86::VDIVBF16Z256rmbk, TB_BCAST_SH}, + {X86::VDIVBF16Zrrk, X86::VDIVBF16Zrmbk, TB_BCAST_SH}, {X86::VDIVPDZ128rrk, X86::VDIVPDZ128rmbk, TB_BCAST_SD}, {X86::VDIVPDZ256rrk, X86::VDIVPDZ256rmbk, TB_BCAST_SD}, {X86::VDIVPDZrrk, X86::VDIVPDZrmbk, TB_BCAST_SD}, @@ -9861,12 +9861,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFIXUPIMMPSZ256rrikz, X86::VFIXUPIMMPSZ256rmbikz, TB_BCAST_SS}, {X86::VFIXUPIMMPSZrrik, X86::VFIXUPIMMPSZrmbik, TB_BCAST_SS}, {X86::VFIXUPIMMPSZrrikz, X86::VFIXUPIMMPSZrmbikz, TB_BCAST_SS}, - {X86::VFMADD132NEPBF16Z128rk, X86::VFMADD132NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFMADD132NEPBF16Z128rkz, X86::VFMADD132NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFMADD132NEPBF16Z256rk, X86::VFMADD132NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFMADD132NEPBF16Z256rkz, X86::VFMADD132NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFMADD132NEPBF16Zrk, X86::VFMADD132NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFMADD132NEPBF16Zrkz, X86::VFMADD132NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFMADD132BF16Z128rk, X86::VFMADD132BF16Z128mbk, TB_BCAST_SH}, + {X86::VFMADD132BF16Z128rkz, 
X86::VFMADD132BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFMADD132BF16Z256rk, X86::VFMADD132BF16Z256mbk, TB_BCAST_SH}, + {X86::VFMADD132BF16Z256rkz, X86::VFMADD132BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFMADD132BF16Zrk, X86::VFMADD132BF16Zmbk, TB_BCAST_SH}, + {X86::VFMADD132BF16Zrkz, X86::VFMADD132BF16Zmbkz, TB_BCAST_SH}, {X86::VFMADD132PDZ128rk, X86::VFMADD132PDZ128mbk, TB_BCAST_SD}, {X86::VFMADD132PDZ128rkz, X86::VFMADD132PDZ128mbkz, TB_BCAST_SD}, {X86::VFMADD132PDZ256rk, X86::VFMADD132PDZ256mbk, TB_BCAST_SD}, @@ -9885,12 +9885,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFMADD132PSZ256rkz, X86::VFMADD132PSZ256mbkz, TB_BCAST_SS}, {X86::VFMADD132PSZrk, X86::VFMADD132PSZmbk, TB_BCAST_SS}, {X86::VFMADD132PSZrkz, X86::VFMADD132PSZmbkz, TB_BCAST_SS}, - {X86::VFMADD213NEPBF16Z128rk, X86::VFMADD213NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFMADD213NEPBF16Z128rkz, X86::VFMADD213NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFMADD213NEPBF16Z256rk, X86::VFMADD213NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFMADD213NEPBF16Z256rkz, X86::VFMADD213NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFMADD213NEPBF16Zrk, X86::VFMADD213NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFMADD213NEPBF16Zrkz, X86::VFMADD213NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFMADD213BF16Z128rk, X86::VFMADD213BF16Z128mbk, TB_BCAST_SH}, + {X86::VFMADD213BF16Z128rkz, X86::VFMADD213BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFMADD213BF16Z256rk, X86::VFMADD213BF16Z256mbk, TB_BCAST_SH}, + {X86::VFMADD213BF16Z256rkz, X86::VFMADD213BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFMADD213BF16Zrk, X86::VFMADD213BF16Zmbk, TB_BCAST_SH}, + {X86::VFMADD213BF16Zrkz, X86::VFMADD213BF16Zmbkz, TB_BCAST_SH}, {X86::VFMADD213PDZ128rk, X86::VFMADD213PDZ128mbk, TB_BCAST_SD}, {X86::VFMADD213PDZ128rkz, X86::VFMADD213PDZ128mbkz, TB_BCAST_SD}, {X86::VFMADD213PDZ256rk, X86::VFMADD213PDZ256mbk, TB_BCAST_SD}, @@ -9909,12 +9909,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFMADD213PSZ256rkz, X86::VFMADD213PSZ256mbkz, TB_BCAST_SS}, {X86::VFMADD213PSZrk, 
X86::VFMADD213PSZmbk, TB_BCAST_SS}, {X86::VFMADD213PSZrkz, X86::VFMADD213PSZmbkz, TB_BCAST_SS}, - {X86::VFMADD231NEPBF16Z128rk, X86::VFMADD231NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFMADD231NEPBF16Z128rkz, X86::VFMADD231NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFMADD231NEPBF16Z256rk, X86::VFMADD231NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFMADD231NEPBF16Z256rkz, X86::VFMADD231NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFMADD231NEPBF16Zrk, X86::VFMADD231NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFMADD231NEPBF16Zrkz, X86::VFMADD231NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFMADD231BF16Z128rk, X86::VFMADD231BF16Z128mbk, TB_BCAST_SH}, + {X86::VFMADD231BF16Z128rkz, X86::VFMADD231BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFMADD231BF16Z256rk, X86::VFMADD231BF16Z256mbk, TB_BCAST_SH}, + {X86::VFMADD231BF16Z256rkz, X86::VFMADD231BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFMADD231BF16Zrk, X86::VFMADD231BF16Zmbk, TB_BCAST_SH}, + {X86::VFMADD231BF16Zrkz, X86::VFMADD231BF16Zmbkz, TB_BCAST_SH}, {X86::VFMADD231PDZ128rk, X86::VFMADD231PDZ128mbk, TB_BCAST_SD}, {X86::VFMADD231PDZ128rkz, X86::VFMADD231PDZ128mbkz, TB_BCAST_SD}, {X86::VFMADD231PDZ256rk, X86::VFMADD231PDZ256mbk, TB_BCAST_SD}, @@ -9993,12 +9993,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFMADDSUB231PSZ256rkz, X86::VFMADDSUB231PSZ256mbkz, TB_BCAST_SS}, {X86::VFMADDSUB231PSZrk, X86::VFMADDSUB231PSZmbk, TB_BCAST_SS}, {X86::VFMADDSUB231PSZrkz, X86::VFMADDSUB231PSZmbkz, TB_BCAST_SS}, - {X86::VFMSUB132NEPBF16Z128rk, X86::VFMSUB132NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFMSUB132NEPBF16Z128rkz, X86::VFMSUB132NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFMSUB132NEPBF16Z256rk, X86::VFMSUB132NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFMSUB132NEPBF16Z256rkz, X86::VFMSUB132NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFMSUB132NEPBF16Zrk, X86::VFMSUB132NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFMSUB132NEPBF16Zrkz, X86::VFMSUB132NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFMSUB132BF16Z128rk, X86::VFMSUB132BF16Z128mbk, TB_BCAST_SH}, + {X86::VFMSUB132BF16Z128rkz, 
X86::VFMSUB132BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFMSUB132BF16Z256rk, X86::VFMSUB132BF16Z256mbk, TB_BCAST_SH}, + {X86::VFMSUB132BF16Z256rkz, X86::VFMSUB132BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFMSUB132BF16Zrk, X86::VFMSUB132BF16Zmbk, TB_BCAST_SH}, + {X86::VFMSUB132BF16Zrkz, X86::VFMSUB132BF16Zmbkz, TB_BCAST_SH}, {X86::VFMSUB132PDZ128rk, X86::VFMSUB132PDZ128mbk, TB_BCAST_SD}, {X86::VFMSUB132PDZ128rkz, X86::VFMSUB132PDZ128mbkz, TB_BCAST_SD}, {X86::VFMSUB132PDZ256rk, X86::VFMSUB132PDZ256mbk, TB_BCAST_SD}, @@ -10017,12 +10017,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFMSUB132PSZ256rkz, X86::VFMSUB132PSZ256mbkz, TB_BCAST_SS}, {X86::VFMSUB132PSZrk, X86::VFMSUB132PSZmbk, TB_BCAST_SS}, {X86::VFMSUB132PSZrkz, X86::VFMSUB132PSZmbkz, TB_BCAST_SS}, - {X86::VFMSUB213NEPBF16Z128rk, X86::VFMSUB213NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFMSUB213NEPBF16Z128rkz, X86::VFMSUB213NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFMSUB213NEPBF16Z256rk, X86::VFMSUB213NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFMSUB213NEPBF16Z256rkz, X86::VFMSUB213NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFMSUB213NEPBF16Zrk, X86::VFMSUB213NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFMSUB213NEPBF16Zrkz, X86::VFMSUB213NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFMSUB213BF16Z128rk, X86::VFMSUB213BF16Z128mbk, TB_BCAST_SH}, + {X86::VFMSUB213BF16Z128rkz, X86::VFMSUB213BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFMSUB213BF16Z256rk, X86::VFMSUB213BF16Z256mbk, TB_BCAST_SH}, + {X86::VFMSUB213BF16Z256rkz, X86::VFMSUB213BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFMSUB213BF16Zrk, X86::VFMSUB213BF16Zmbk, TB_BCAST_SH}, + {X86::VFMSUB213BF16Zrkz, X86::VFMSUB213BF16Zmbkz, TB_BCAST_SH}, {X86::VFMSUB213PDZ128rk, X86::VFMSUB213PDZ128mbk, TB_BCAST_SD}, {X86::VFMSUB213PDZ128rkz, X86::VFMSUB213PDZ128mbkz, TB_BCAST_SD}, {X86::VFMSUB213PDZ256rk, X86::VFMSUB213PDZ256mbk, TB_BCAST_SD}, @@ -10041,12 +10041,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFMSUB213PSZ256rkz, X86::VFMSUB213PSZ256mbkz, TB_BCAST_SS}, {X86::VFMSUB213PSZrk, 
X86::VFMSUB213PSZmbk, TB_BCAST_SS}, {X86::VFMSUB213PSZrkz, X86::VFMSUB213PSZmbkz, TB_BCAST_SS}, - {X86::VFMSUB231NEPBF16Z128rk, X86::VFMSUB231NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFMSUB231NEPBF16Z128rkz, X86::VFMSUB231NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFMSUB231NEPBF16Z256rk, X86::VFMSUB231NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFMSUB231NEPBF16Z256rkz, X86::VFMSUB231NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFMSUB231NEPBF16Zrk, X86::VFMSUB231NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFMSUB231NEPBF16Zrkz, X86::VFMSUB231NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFMSUB231BF16Z128rk, X86::VFMSUB231BF16Z128mbk, TB_BCAST_SH}, + {X86::VFMSUB231BF16Z128rkz, X86::VFMSUB231BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFMSUB231BF16Z256rk, X86::VFMSUB231BF16Z256mbk, TB_BCAST_SH}, + {X86::VFMSUB231BF16Z256rkz, X86::VFMSUB231BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFMSUB231BF16Zrk, X86::VFMSUB231BF16Zmbk, TB_BCAST_SH}, + {X86::VFMSUB231BF16Zrkz, X86::VFMSUB231BF16Zmbkz, TB_BCAST_SH}, {X86::VFMSUB231PDZ128rk, X86::VFMSUB231PDZ128mbk, TB_BCAST_SD}, {X86::VFMSUB231PDZ128rkz, X86::VFMSUB231PDZ128mbkz, TB_BCAST_SD}, {X86::VFMSUB231PDZ256rk, X86::VFMSUB231PDZ256mbk, TB_BCAST_SD}, @@ -10122,12 +10122,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFMULCPHZ128rrk, X86::VFMULCPHZ128rmbk, TB_BCAST_SS}, {X86::VFMULCPHZ256rrk, X86::VFMULCPHZ256rmbk, TB_BCAST_SS}, {X86::VFMULCPHZrrk, X86::VFMULCPHZrmbk, TB_BCAST_SS}, - {X86::VFNMADD132NEPBF16Z128rk, X86::VFNMADD132NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFNMADD132NEPBF16Z128rkz, X86::VFNMADD132NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFNMADD132NEPBF16Z256rk, X86::VFNMADD132NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFNMADD132NEPBF16Z256rkz, X86::VFNMADD132NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFNMADD132NEPBF16Zrk, X86::VFNMADD132NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFNMADD132NEPBF16Zrkz, X86::VFNMADD132NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFNMADD132BF16Z128rk, X86::VFNMADD132BF16Z128mbk, TB_BCAST_SH}, + {X86::VFNMADD132BF16Z128rkz, 
X86::VFNMADD132BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFNMADD132BF16Z256rk, X86::VFNMADD132BF16Z256mbk, TB_BCAST_SH}, + {X86::VFNMADD132BF16Z256rkz, X86::VFNMADD132BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFNMADD132BF16Zrk, X86::VFNMADD132BF16Zmbk, TB_BCAST_SH}, + {X86::VFNMADD132BF16Zrkz, X86::VFNMADD132BF16Zmbkz, TB_BCAST_SH}, {X86::VFNMADD132PDZ128rk, X86::VFNMADD132PDZ128mbk, TB_BCAST_SD}, {X86::VFNMADD132PDZ128rkz, X86::VFNMADD132PDZ128mbkz, TB_BCAST_SD}, {X86::VFNMADD132PDZ256rk, X86::VFNMADD132PDZ256mbk, TB_BCAST_SD}, @@ -10146,12 +10146,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFNMADD132PSZ256rkz, X86::VFNMADD132PSZ256mbkz, TB_BCAST_SS}, {X86::VFNMADD132PSZrk, X86::VFNMADD132PSZmbk, TB_BCAST_SS}, {X86::VFNMADD132PSZrkz, X86::VFNMADD132PSZmbkz, TB_BCAST_SS}, - {X86::VFNMADD213NEPBF16Z128rk, X86::VFNMADD213NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFNMADD213NEPBF16Z128rkz, X86::VFNMADD213NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFNMADD213NEPBF16Z256rk, X86::VFNMADD213NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFNMADD213NEPBF16Z256rkz, X86::VFNMADD213NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFNMADD213NEPBF16Zrk, X86::VFNMADD213NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFNMADD213NEPBF16Zrkz, X86::VFNMADD213NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFNMADD213BF16Z128rk, X86::VFNMADD213BF16Z128mbk, TB_BCAST_SH}, + {X86::VFNMADD213BF16Z128rkz, X86::VFNMADD213BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFNMADD213BF16Z256rk, X86::VFNMADD213BF16Z256mbk, TB_BCAST_SH}, + {X86::VFNMADD213BF16Z256rkz, X86::VFNMADD213BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFNMADD213BF16Zrk, X86::VFNMADD213BF16Zmbk, TB_BCAST_SH}, + {X86::VFNMADD213BF16Zrkz, X86::VFNMADD213BF16Zmbkz, TB_BCAST_SH}, {X86::VFNMADD213PDZ128rk, X86::VFNMADD213PDZ128mbk, TB_BCAST_SD}, {X86::VFNMADD213PDZ128rkz, X86::VFNMADD213PDZ128mbkz, TB_BCAST_SD}, {X86::VFNMADD213PDZ256rk, X86::VFNMADD213PDZ256mbk, TB_BCAST_SD}, @@ -10170,12 +10170,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFNMADD213PSZ256rkz, 
X86::VFNMADD213PSZ256mbkz, TB_BCAST_SS}, {X86::VFNMADD213PSZrk, X86::VFNMADD213PSZmbk, TB_BCAST_SS}, {X86::VFNMADD213PSZrkz, X86::VFNMADD213PSZmbkz, TB_BCAST_SS}, - {X86::VFNMADD231NEPBF16Z128rk, X86::VFNMADD231NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFNMADD231NEPBF16Z128rkz, X86::VFNMADD231NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFNMADD231NEPBF16Z256rk, X86::VFNMADD231NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFNMADD231NEPBF16Z256rkz, X86::VFNMADD231NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFNMADD231NEPBF16Zrk, X86::VFNMADD231NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFNMADD231NEPBF16Zrkz, X86::VFNMADD231NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFNMADD231BF16Z128rk, X86::VFNMADD231BF16Z128mbk, TB_BCAST_SH}, + {X86::VFNMADD231BF16Z128rkz, X86::VFNMADD231BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFNMADD231BF16Z256rk, X86::VFNMADD231BF16Z256mbk, TB_BCAST_SH}, + {X86::VFNMADD231BF16Z256rkz, X86::VFNMADD231BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFNMADD231BF16Zrk, X86::VFNMADD231BF16Zmbk, TB_BCAST_SH}, + {X86::VFNMADD231BF16Zrkz, X86::VFNMADD231BF16Zmbkz, TB_BCAST_SH}, {X86::VFNMADD231PDZ128rk, X86::VFNMADD231PDZ128mbk, TB_BCAST_SD}, {X86::VFNMADD231PDZ128rkz, X86::VFNMADD231PDZ128mbkz, TB_BCAST_SD}, {X86::VFNMADD231PDZ256rk, X86::VFNMADD231PDZ256mbk, TB_BCAST_SD}, @@ -10194,12 +10194,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFNMADD231PSZ256rkz, X86::VFNMADD231PSZ256mbkz, TB_BCAST_SS}, {X86::VFNMADD231PSZrk, X86::VFNMADD231PSZmbk, TB_BCAST_SS}, {X86::VFNMADD231PSZrkz, X86::VFNMADD231PSZmbkz, TB_BCAST_SS}, - {X86::VFNMSUB132NEPBF16Z128rk, X86::VFNMSUB132NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFNMSUB132NEPBF16Z128rkz, X86::VFNMSUB132NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFNMSUB132NEPBF16Z256rk, X86::VFNMSUB132NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFNMSUB132NEPBF16Z256rkz, X86::VFNMSUB132NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFNMSUB132NEPBF16Zrk, X86::VFNMSUB132NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFNMSUB132NEPBF16Zrkz, X86::VFNMSUB132NEPBF16Zmbkz, TB_BCAST_SH}, + 
{X86::VFNMSUB132BF16Z128rk, X86::VFNMSUB132BF16Z128mbk, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Z128rkz, X86::VFNMSUB132BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Z256rk, X86::VFNMSUB132BF16Z256mbk, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Z256rkz, X86::VFNMSUB132BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Zrk, X86::VFNMSUB132BF16Zmbk, TB_BCAST_SH}, + {X86::VFNMSUB132BF16Zrkz, X86::VFNMSUB132BF16Zmbkz, TB_BCAST_SH}, {X86::VFNMSUB132PDZ128rk, X86::VFNMSUB132PDZ128mbk, TB_BCAST_SD}, {X86::VFNMSUB132PDZ128rkz, X86::VFNMSUB132PDZ128mbkz, TB_BCAST_SD}, {X86::VFNMSUB132PDZ256rk, X86::VFNMSUB132PDZ256mbk, TB_BCAST_SD}, @@ -10218,12 +10218,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFNMSUB132PSZ256rkz, X86::VFNMSUB132PSZ256mbkz, TB_BCAST_SS}, {X86::VFNMSUB132PSZrk, X86::VFNMSUB132PSZmbk, TB_BCAST_SS}, {X86::VFNMSUB132PSZrkz, X86::VFNMSUB132PSZmbkz, TB_BCAST_SS}, - {X86::VFNMSUB213NEPBF16Z128rk, X86::VFNMSUB213NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFNMSUB213NEPBF16Z128rkz, X86::VFNMSUB213NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFNMSUB213NEPBF16Z256rk, X86::VFNMSUB213NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFNMSUB213NEPBF16Z256rkz, X86::VFNMSUB213NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFNMSUB213NEPBF16Zrk, X86::VFNMSUB213NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFNMSUB213NEPBF16Zrkz, X86::VFNMSUB213NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Z128rk, X86::VFNMSUB213BF16Z128mbk, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Z128rkz, X86::VFNMSUB213BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Z256rk, X86::VFNMSUB213BF16Z256mbk, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Z256rkz, X86::VFNMSUB213BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Zrk, X86::VFNMSUB213BF16Zmbk, TB_BCAST_SH}, + {X86::VFNMSUB213BF16Zrkz, X86::VFNMSUB213BF16Zmbkz, TB_BCAST_SH}, {X86::VFNMSUB213PDZ128rk, X86::VFNMSUB213PDZ128mbk, TB_BCAST_SD}, {X86::VFNMSUB213PDZ128rkz, X86::VFNMSUB213PDZ128mbkz, TB_BCAST_SD}, {X86::VFNMSUB213PDZ256rk, X86::VFNMSUB213PDZ256mbk, TB_BCAST_SD}, @@ -10242,12 
+10242,12 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VFNMSUB213PSZ256rkz, X86::VFNMSUB213PSZ256mbkz, TB_BCAST_SS}, {X86::VFNMSUB213PSZrk, X86::VFNMSUB213PSZmbk, TB_BCAST_SS}, {X86::VFNMSUB213PSZrkz, X86::VFNMSUB213PSZmbkz, TB_BCAST_SS}, - {X86::VFNMSUB231NEPBF16Z128rk, X86::VFNMSUB231NEPBF16Z128mbk, TB_BCAST_SH}, - {X86::VFNMSUB231NEPBF16Z128rkz, X86::VFNMSUB231NEPBF16Z128mbkz, TB_BCAST_SH}, - {X86::VFNMSUB231NEPBF16Z256rk, X86::VFNMSUB231NEPBF16Z256mbk, TB_BCAST_SH}, - {X86::VFNMSUB231NEPBF16Z256rkz, X86::VFNMSUB231NEPBF16Z256mbkz, TB_BCAST_SH}, - {X86::VFNMSUB231NEPBF16Zrk, X86::VFNMSUB231NEPBF16Zmbk, TB_BCAST_SH}, - {X86::VFNMSUB231NEPBF16Zrkz, X86::VFNMSUB231NEPBF16Zmbkz, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Z128rk, X86::VFNMSUB231BF16Z128mbk, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Z128rkz, X86::VFNMSUB231BF16Z128mbkz, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Z256rk, X86::VFNMSUB231BF16Z256mbk, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Z256rkz, X86::VFNMSUB231BF16Z256mbkz, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Zrk, X86::VFNMSUB231BF16Zmbk, TB_BCAST_SH}, + {X86::VFNMSUB231BF16Zrkz, X86::VFNMSUB231BF16Zmbkz, TB_BCAST_SH}, {X86::VFNMSUB231PDZ128rk, X86::VFNMSUB231PDZ128mbk, TB_BCAST_SD}, {X86::VFNMSUB231PDZ128rkz, X86::VFNMSUB231PDZ128mbkz, TB_BCAST_SD}, {X86::VFNMSUB231PDZ256rk, X86::VFNMSUB231PDZ256mbk, TB_BCAST_SD}, @@ -10272,6 +10272,9 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VGF2P8AFFINEQBZ128rrik, X86::VGF2P8AFFINEQBZ128rmbik, TB_BCAST_Q}, {X86::VGF2P8AFFINEQBZ256rrik, X86::VGF2P8AFFINEQBZ256rmbik, TB_BCAST_Q}, {X86::VGF2P8AFFINEQBZrrik, X86::VGF2P8AFFINEQBZrmbik, TB_BCAST_Q}, + {X86::VMAXBF16Z128rrk, X86::VMAXBF16Z128rmbk, TB_BCAST_SH}, + {X86::VMAXBF16Z256rrk, X86::VMAXBF16Z256rmbk, TB_BCAST_SH}, + {X86::VMAXBF16Zrrk, X86::VMAXBF16Zrmbk, TB_BCAST_SH}, {X86::VMAXCPDZ128rrk, X86::VMAXCPDZ128rmbk, TB_BCAST_SD}, {X86::VMAXCPDZ256rrk, X86::VMAXCPDZ256rmbk, TB_BCAST_SD}, {X86::VMAXCPDZrrk, X86::VMAXCPDZrmbk, TB_BCAST_SD}, @@ -10281,9 
+10284,6 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VMAXCPSZ128rrk, X86::VMAXCPSZ128rmbk, TB_BCAST_SS}, {X86::VMAXCPSZ256rrk, X86::VMAXCPSZ256rmbk, TB_BCAST_SS}, {X86::VMAXCPSZrrk, X86::VMAXCPSZrmbk, TB_BCAST_SS}, - {X86::VMAXPBF16Z128rrk, X86::VMAXPBF16Z128rmbk, TB_BCAST_SH}, - {X86::VMAXPBF16Z256rrk, X86::VMAXPBF16Z256rmbk, TB_BCAST_SH}, - {X86::VMAXPBF16Zrrk, X86::VMAXPBF16Zrmbk, TB_BCAST_SH}, {X86::VMAXPDZ128rrk, X86::VMAXPDZ128rmbk, TB_BCAST_SD}, {X86::VMAXPDZ256rrk, X86::VMAXPDZ256rmbk, TB_BCAST_SD}, {X86::VMAXPDZrrk, X86::VMAXPDZrmbk, TB_BCAST_SD}, @@ -10293,6 +10293,9 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VMAXPSZ128rrk, X86::VMAXPSZ128rmbk, TB_BCAST_SS}, {X86::VMAXPSZ256rrk, X86::VMAXPSZ256rmbk, TB_BCAST_SS}, {X86::VMAXPSZrrk, X86::VMAXPSZrmbk, TB_BCAST_SS}, + {X86::VMINBF16Z128rrk, X86::VMINBF16Z128rmbk, TB_BCAST_SH}, + {X86::VMINBF16Z256rrk, X86::VMINBF16Z256rmbk, TB_BCAST_SH}, + {X86::VMINBF16Zrrk, X86::VMINBF16Zrmbk, TB_BCAST_SH}, {X86::VMINCPDZ128rrk, X86::VMINCPDZ128rmbk, TB_BCAST_SD}, {X86::VMINCPDZ256rrk, X86::VMINCPDZ256rmbk, TB_BCAST_SD}, {X86::VMINCPDZrrk, X86::VMINCPDZrmbk, TB_BCAST_SD}, @@ -10314,9 +10317,6 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VMINMAXPSZ128rrik, X86::VMINMAXPSZ128rmbik, TB_BCAST_SS}, {X86::VMINMAXPSZ256rrik, X86::VMINMAXPSZ256rmbik, TB_BCAST_SS}, {X86::VMINMAXPSZrrik, X86::VMINMAXPSZrmbik, TB_BCAST_SS}, - {X86::VMINPBF16Z128rrk, X86::VMINPBF16Z128rmbk, TB_BCAST_SH}, - {X86::VMINPBF16Z256rrk, X86::VMINPBF16Z256rmbk, TB_BCAST_SH}, - {X86::VMINPBF16Zrrk, X86::VMINPBF16Zrmbk, TB_BCAST_SH}, {X86::VMINPDZ128rrk, X86::VMINPDZ128rmbk, TB_BCAST_SD}, {X86::VMINPDZ256rrk, X86::VMINPDZ256rmbk, TB_BCAST_SD}, {X86::VMINPDZrrk, X86::VMINPDZrmbk, TB_BCAST_SD}, @@ -10326,9 +10326,9 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VMINPSZ128rrk, X86::VMINPSZ128rmbk, TB_BCAST_SS}, {X86::VMINPSZ256rrk, X86::VMINPSZ256rmbk, TB_BCAST_SS}, {X86::VMINPSZrrk, 
X86::VMINPSZrmbk, TB_BCAST_SS}, - {X86::VMULNEPBF16Z128rrk, X86::VMULNEPBF16Z128rmbk, TB_BCAST_SH}, - {X86::VMULNEPBF16Z256rrk, X86::VMULNEPBF16Z256rmbk, TB_BCAST_SH}, - {X86::VMULNEPBF16Zrrk, X86::VMULNEPBF16Zrmbk, TB_BCAST_SH}, + {X86::VMULBF16Z128rrk, X86::VMULBF16Z128rmbk, TB_BCAST_SH}, + {X86::VMULBF16Z256rrk, X86::VMULBF16Z256rmbk, TB_BCAST_SH}, + {X86::VMULBF16Zrrk, X86::VMULBF16Zrmbk, TB_BCAST_SH}, {X86::VMULPDZ128rrk, X86::VMULPDZ128rmbk, TB_BCAST_SD}, {X86::VMULPDZ256rrk, X86::VMULPDZ256rmbk, TB_BCAST_SD}, {X86::VMULPDZrrk, X86::VMULPDZrmbk, TB_BCAST_SD}, @@ -10691,9 +10691,9 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VRANGEPSZ128rrik, X86::VRANGEPSZ128rmbik, TB_BCAST_SS}, {X86::VRANGEPSZ256rrik, X86::VRANGEPSZ256rmbik, TB_BCAST_SS}, {X86::VRANGEPSZrrik, X86::VRANGEPSZrmbik, TB_BCAST_SS}, - {X86::VSCALEFPBF16Z128rrk, X86::VSCALEFPBF16Z128rmbk, TB_BCAST_SH}, - {X86::VSCALEFPBF16Z256rrk, X86::VSCALEFPBF16Z256rmbk, TB_BCAST_SH}, - {X86::VSCALEFPBF16Zrrk, X86::VSCALEFPBF16Zrmbk, TB_BCAST_SH}, + {X86::VSCALEFBF16Z128rrk, X86::VSCALEFBF16Z128rmbk, TB_BCAST_SH}, + {X86::VSCALEFBF16Z256rrk, X86::VSCALEFBF16Z256rmbk, TB_BCAST_SH}, + {X86::VSCALEFBF16Zrrk, X86::VSCALEFBF16Zrmbk, TB_BCAST_SH}, {X86::VSCALEFPDZ128rrk, X86::VSCALEFPDZ128rmbk, TB_BCAST_SD}, {X86::VSCALEFPDZ256rrk, X86::VSCALEFPDZ256rmbk, TB_BCAST_SD}, {X86::VSCALEFPDZrrk, X86::VSCALEFPDZrmbk, TB_BCAST_SD}, @@ -10717,9 +10717,9 @@ static const X86FoldTableEntry BroadcastTable4[] = { {X86::VSHUFPSZ128rrik, X86::VSHUFPSZ128rmbik, TB_BCAST_SS}, {X86::VSHUFPSZ256rrik, X86::VSHUFPSZ256rmbik, TB_BCAST_SS}, {X86::VSHUFPSZrrik, X86::VSHUFPSZrmbik, TB_BCAST_SS}, - {X86::VSUBNEPBF16Z128rrk, X86::VSUBNEPBF16Z128rmbk, TB_BCAST_SH}, - {X86::VSUBNEPBF16Z256rrk, X86::VSUBNEPBF16Z256rmbk, TB_BCAST_SH}, - {X86::VSUBNEPBF16Zrrk, X86::VSUBNEPBF16Zrmbk, TB_BCAST_SH}, + {X86::VSUBBF16Z128rrk, X86::VSUBBF16Z128rmbk, TB_BCAST_SH}, + {X86::VSUBBF16Z256rrk, X86::VSUBBF16Z256rmbk, TB_BCAST_SH}, + 
{X86::VSUBBF16Zrrk, X86::VSUBBF16Zrmbk, TB_BCAST_SH}, {X86::VSUBPDZ128rrk, X86::VSUBPDZ128rmbk, TB_BCAST_SD}, {X86::VSUBPDZ256rrk, X86::VSUBPDZ256rmbk, TB_BCAST_SD}, {X86::VSUBPDZrrk, X86::VSUBPDZrmbk, TB_BCAST_SD}, From 91a342924174855fd867c3b4c54a6ace8bb87996 Mon Sep 17 00:00:00 2001 From: "Wang, Phoebe" Date: Thu, 23 Jan 2025 22:57:09 +0800 Subject: [PATCH 2/2] Format X86InstrFMA3Info.cpp --- llvm/lib/Target/X86/X86InstrFMA3Info.cpp | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/llvm/lib/Target/X86/X86InstrFMA3Info.cpp b/llvm/lib/Target/X86/X86InstrFMA3Info.cpp index d0c508d9934c3..86f6c733bdf75 100644 --- a/llvm/lib/Target/X86/X86InstrFMA3Info.cpp +++ b/llvm/lib/Target/X86/X86InstrFMA3Info.cpp @@ -52,7 +52,7 @@ using namespace llvm; FMA3GROUP_PACKED_WIDTHS_Z(Name, PH, Attrs) \ FMA3GROUP_PACKED_WIDTHS_ALL(Name, PS, Attrs) -#define FMA3GROUP_PACKED_BF16(Name, Attrs) \ +#define FMA3GROUP_PACKED_BF16(Name, Attrs) \ FMA3GROUP_PACKED_WIDTHS_Z(Name, BF16, Attrs) #define FMA3GROUP_SCALAR_WIDTHS_Z(Name, Suf, Attrs) \ @@ -92,10 +92,10 @@ static const X86InstrFMA3Group Groups[] = { FMA3GROUP_MASKED(Name, Type##Z256##Suf, Attrs) \ FMA3GROUP_MASKED(Name, Type##Z##Suf, Attrs) -#define FMA3GROUP_PACKED_AVX512_ALL(Name, Suf, Attrs) \ - FMA3GROUP_PACKED_AVX512_WIDTHS(Name, BF16, Suf, Attrs) \ - FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PD, Suf, Attrs) \ - FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PH, Suf, Attrs) \ +#define FMA3GROUP_PACKED_AVX512_ALL(Name, Suf, Attrs) \ + FMA3GROUP_PACKED_AVX512_WIDTHS(Name, BF16, Suf, Attrs) \ + FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PD, Suf, Attrs) \ + FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PH, Suf, Attrs) \ FMA3GROUP_PACKED_AVX512_WIDTHS(Name, PS, Suf, Attrs) #define FMA3GROUP_PACKED_AVX512_DHS(Name, Suf, Attrs) \